diff --git a/.gitattributes b/.gitattributes index a6344aac8c09253b3b630fb776ae94478aa0275b..52373fe24473b1aa44333d318f578ae6bf04b49b 100644 --- a/.gitattributes +++ b/.gitattributes @@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text *.zip filter=lfs diff=lfs merge=lfs -text *.zst filter=lfs diff=lfs merge=lfs -text *tfevents* filter=lfs diff=lfs merge=lfs -text +tokenizer.json filter=lfs diff=lfs merge=lfs -text diff --git a/README.md b/README.md new file mode 100644 index 0000000000000000000000000000000000000000..4c192fb495da2b7b34030deda13f226c99060650 --- /dev/null +++ b/README.md @@ -0,0 +1,57 @@ +--- +language: +- en +- zh +library_name: transformers +license: mit +pipeline_tag: text-generation +--- + +# GLM-4.6-FP8 + +
+ +
+

+ 👋 Join our Discord community. +
+ 📖 Check out the GLM-4.6 technical blog, technical report (GLM-4.5), and Zhipu AI technical documentation. +
+ 📍 Use GLM-4.6 API services on the Z.ai API Platform. +
+ 👉 One click to GLM-4.6. +

+ +## Model Introduction + +Compared with GLM-4.5, **GLM-4.6** brings several key improvements: + +* **Longer context window:** The context window has been expanded from 128K to 200K tokens, enabling the model to handle more complex agentic tasks. +* **Superior coding performance:** The model achieves higher scores on code benchmarks and demonstrates better real-world performance in applications such as Claude Code, Cline, Roo Code and Kilo Code, including improvements in generating visually polished front-end pages. +* **Advanced reasoning:** GLM-4.6 shows a clear improvement in reasoning performance and supports tool use during inference, leading to stronger overall capability. +* **More capable agents:** GLM-4.6 exhibits stronger performance in tool-using and search-based agents, and integrates more effectively within agent frameworks. +* **Refined writing:** Better aligns with human preferences in style and readability, and performs more naturally in role-playing scenarios. + +We evaluated GLM-4.6 across eight public benchmarks covering agents, reasoning, and coding. Results show clear gains over GLM-4.5, with GLM-4.6 also holding competitive advantages over leading domestic and international models such as **DeepSeek-V3.1-Terminus** and **Claude Sonnet 4**. + +![bench](https://raw.githubusercontent.com/zai-org/GLM-4.5/refs/heads/main/resources/bench_glm46.png) + +## Inference + +**Both GLM-4.5 and GLM-4.6 use the same inference method.** + +You can check our [GitHub repository](https://github.com/zai-org/GLM-4.5) for more details. + +## Recommended Evaluation Parameters + +For general evaluations, we recommend using a **sampling temperature of 1.0**. + +For **code-related evaluation tasks** (such as LCB), it is further recommended to set: + +- `top_p = 0.95` +- `top_k = 40` + +## Evaluation + +- For tool-integrated reasoning, please refer to [this doc](https://github.com/zai-org/GLM-4.5/blob/main/resources/glm_4.6_tir_guide.md).
+- For search benchmark, we design a specific format for searching toolcall in thinking mode to support search agent, please refer to [this](https://github.com/zai-org/GLM-4.5/blob/main/resources/trajectory_search.json). for the detailed template. diff --git a/chat_template.jinja b/chat_template.jinja new file mode 100644 index 0000000000000000000000000000000000000000..41478957aca7a04b7321022e7d1f73de5badd995 --- /dev/null +++ b/chat_template.jinja @@ -0,0 +1,103 @@ +[gMASK] +{%- if tools -%} +<|system|> +# Tools + +You may call one or more functions to assist with the user query. + +You are provided with function signatures within XML tags: + +{% for tool in tools %} +{{ tool | tojson(ensure_ascii=False) }} +{% endfor %} + + +For each function call, output the function name and arguments within the following XML format: +{function-name} +{arg-key-1} +{arg-value-1} +{arg-key-2} +{arg-value-2} +... +{%- endif -%} +{%- macro visible_text(content) -%} + {%- if content is string -%} + {{- content }} + {%- elif content is iterable and content is not mapping -%} + {%- for item in content -%} + {%- if item is mapping and item.type == 'text' -%} + {{- item.text }} + {%- elif item is string -%} + {{- item }} + {%- endif -%} + {%- endfor -%} + {%- else -%} + {{- content }} + {%- endif -%} +{%- endmacro -%} +{%- set ns = namespace(last_user_index=-1) %} +{%- for m in messages %} + {%- if m.role == 'user' %} + {% set ns.last_user_index = loop.index0 -%} + {%- endif %} +{%- endfor %} +{% for m in messages %} +{%- if m.role == 'user' -%}<|user|> +{{ visible_text(m.content) }} +{{- '/nothink' if (enable_thinking is defined and not enable_thinking and not visible_text(m.content).endswith("/nothink")) else '' -}} +{%- elif m.role == 'assistant' -%} +<|assistant|> +{%- set reasoning_content = '' %} +{%- set content = visible_text(m.content) %} +{%- if m.reasoning_content is string %} + {%- set reasoning_content = m.reasoning_content %} +{%- else %} + {%- if '' in content %} + {%- 
set reasoning_content = content.split('')[0].rstrip('\n').split('')[-1].lstrip('\n') %} + {%- set content = content.split('')[-1].lstrip('\n') %} + {%- endif %} +{%- endif %} +{%- if loop.index0 > ns.last_user_index and reasoning_content -%} +{{ '\n' + reasoning_content.strip() + ''}} +{%- else -%} +{{ '\n' }} +{%- endif -%} +{%- if content.strip() -%} +{{ '\n' + content.strip() }} +{%- endif -%} +{% if m.tool_calls %} +{% for tc in m.tool_calls %} +{%- if tc.function %} + {%- set tc = tc.function %} +{%- endif %} +{{ '\n' + tc.name }} +{% set _args = tc.arguments %} +{% for k, v in _args.items() %} +{{ k }} +{{ v | tojson(ensure_ascii=False) if v is not string else v }} +{% endfor %} +{% endfor %} +{% endif %} +{%- elif m.role == 'tool' -%} +{%- if m.content is string -%} +{%- if loop.first or (messages[loop.index0 - 1].role != "tool") %} + {{- '<|observation|>' }} +{%- endif %} +{{- '\n\n' }} +{{- m.content }} +{{- '\n' }} +{%- else -%} +<|observation|>{% for tr in m.content %} + + +{{ tr.output if tr.output is defined else tr }} +{% endfor -%} +{% endif -%} +{%- elif m.role == 'system' -%} +<|system|> +{{ visible_text(m.content) }} +{%- endif -%} +{%- endfor -%} +{%- if add_generation_prompt -%} + <|assistant|>{{- '\n' if (enable_thinking is defined and not enable_thinking) else '' -}} +{%- endif -%} \ No newline at end of file diff --git a/config.json b/config.json new file mode 100644 index 0000000000000000000000000000000000000000..2583316dbdba4a193a7560a659add3461848eecd --- /dev/null +++ b/config.json @@ -0,0 +1,921 @@ +{ + "architectures": [ + "Glm4MoeForCausalLM" + ], + "attention_bias": true, + "attention_dropout": 0.0, + "pad_token_id": 151329, + "eos_token_id": [ + 151329, + 151336, + 151338 + ], + "head_dim": 128, + "hidden_act": "silu", + "hidden_size": 5120, + "partial_rotary_factor": 0.5, + "initializer_range": 0.02, + "intermediate_size": 12288, + "max_position_embeddings": 202752, + "model_type": "glm4_moe", + "moe_intermediate_size": 1536, + 
"norm_topk_prob": true, + "num_attention_heads": 96, + "n_group": 1, + "topk_group": 1, + "n_routed_experts": 160, + "n_shared_experts": 1, + "routed_scaling_factor": 2.5, + "num_experts_per_tok": 8, + "first_k_dense_replace": 3, + "num_hidden_layers": 92, + "num_key_value_heads": 8, + "rms_norm_eps": 1e-05, + "rope_scaling": null, + "rope_theta": 1000000, + "num_nextn_predict_layers": 1, + "tie_word_embeddings": false, + "torch_dtype": "bfloat16", + "transformers_version": "4.54.0", + "use_cache": true, + "use_qk_norm": true, + "vocab_size": 151552, + "quantization_config": { + "config_groups": { + "group_0": { + "input_activations": { + "actorder": null, + "block_structure": null, + "dynamic": true, + "group_size": null, + "num_bits": 8, + "observer": null, + "observer_kwargs": {}, + "strategy": "token", + "symmetric": true, + "type": "float" + }, + "output_activations": null, + "targets": [ + "Linear" + ], + "weights": { + "actorder": null, + "block_structure": null, + "dynamic": false, + "group_size": null, + "num_bits": 8, + "observer": "minmax", + "observer_kwargs": {}, + "strategy": "channel", + "symmetric": true, + "type": "float" + } + } + }, + "format": "float-quantized", + "ignore": [ + "model.layers.12.input_layernorm", + "model.layers.48.input_layernorm", + "model.layers.74.input_layernorm", + "model.layers.5.self_attn.q_norm", + "model.layers.11.self_attn.k_proj.bias", + "model.layers.3.self_attn.k_proj.bias", + "model.layers.53.self_attn.q_norm", + "model.layers.52.mlp.gate", + "model.layers.29.mlp.gate.e_score_correction_bias", + "model.layers.34.post_attention_layernorm", + "model.layers.88.post_attention_layernorm", + "model.layers.17.input_layernorm", + "model.layers.37.self_attn.k_norm", + "model.layers.9.mlp.gate.e_score_correction_bias", + "model.layers.17.self_attn.v_proj.bias", + "model.layers.82.self_attn.q_norm", + "model.layers.41.mlp.gate", + "model.layers.73.input_layernorm", + "model.layers.72.input_layernorm", + 
"model.layers.61.post_attention_layernorm", + "model.layers.30.input_layernorm", + "model.layers.80.mlp.gate", + "model.layers.14.input_layernorm", + "model.layers.45.self_attn.k_norm", + "model.layers.55.mlp.gate", + "model.layers.9.input_layernorm", + "model.layers.13.input_layernorm", + "model.layers.47.self_attn.q_proj.bias", + "model.layers.84.post_attention_layernorm", + "model.layers.85.self_attn.q_norm", + "model.layers.53.self_attn.v_proj.bias", + "model.layers.83.self_attn.v_proj.bias", + "model.layers.35.self_attn.v_proj.bias", + "model.layers.76.mlp.gate.e_score_correction_bias", + "model.layers.36.input_layernorm", + "model.layers.13.post_attention_layernorm", + "model.layers.71.self_attn.k_proj.bias", + "model.layers.84.mlp.gate.e_score_correction_bias", + "model.layers.46.self_attn.k_norm", + "model.layers.50.self_attn.q_norm", + "model.layers.59.self_attn.q_proj.bias", + "model.layers.5.input_layernorm", + "model.layers.29.mlp.gate", + "model.layers.73.self_attn.q_norm", + "model.layers.27.mlp.gate", + "model.layers.49.post_attention_layernorm", + "model.layers.63.self_attn.q_proj.bias", + "model.layers.7.self_attn.q_proj.bias", + "model.layers.5.self_attn.k_proj.bias", + "model.layers.70.self_attn.q_proj.bias", + "model.layers.70.self_attn.k_norm", + "model.layers.15.self_attn.q_proj.bias", + "model.layers.59.self_attn.q_norm", + "model.layers.89.self_attn.k_proj.bias", + "model.layers.89.self_attn.q_norm", + "model.layers.42.mlp.gate.e_score_correction_bias", + "model.layers.62.self_attn.q_norm", + "model.layers.18.input_layernorm", + "model.layers.79.post_attention_layernorm", + "model.layers.63.self_attn.k_norm", + "model.layers.58.input_layernorm", + "model.layers.57.mlp.gate", + "model.layers.32.self_attn.q_norm", + "model.layers.34.self_attn.v_proj.bias", + "model.layers.83.self_attn.k_proj.bias", + "model.layers.7.input_layernorm", + "model.layers.72.self_attn.k_norm", + "model.layers.55.self_attn.v_proj.bias", + 
"model.layers.2.self_attn.k_proj.bias", + "model.layers.23.post_attention_layernorm", + "model.layers.60.post_attention_layernorm", + "model.layers.33.self_attn.k_proj.bias", + "model.layers.85.self_attn.k_proj.bias", + "model.layers.83.mlp.gate.e_score_correction_bias", + "model.layers.20.self_attn.k_proj.bias", + "model.layers.11.mlp.gate", + "model.layers.82.input_layernorm", + "model.layers.83.self_attn.q_norm", + "model.layers.9.post_attention_layernorm", + "model.layers.55.mlp.gate.e_score_correction_bias", + "model.layers.21.mlp.gate", + "model.layers.41.mlp.gate.e_score_correction_bias", + "model.layers.10.mlp.gate.e_score_correction_bias", + "model.layers.49.mlp.gate", + "model.layers.56.self_attn.k_norm", + "model.layers.86.self_attn.q_norm", + "model.layers.89.input_layernorm", + "model.layers.16.input_layernorm", + "model.layers.25.mlp.gate.e_score_correction_bias", + "model.layers.8.self_attn.k_norm", + "model.layers.72.post_attention_layernorm", + "model.layers.92.self_attn.q_norm", + "model.layers.73.post_attention_layernorm", + "model.layers.71.mlp.gate.e_score_correction_bias", + "model.layers.42.input_layernorm", + "model.layers.25.self_attn.k_norm", + "model.layers.50.self_attn.q_proj.bias", + "model.layers.13.self_attn.k_norm", + "model.layers.65.mlp.gate.e_score_correction_bias", + "model.layers.9.self_attn.k_norm", + "model.layers.3.input_layernorm", + "model.layers.90.self_attn.q_proj.bias", + "model.layers.35.self_attn.q_norm", + "model.layers.74.mlp.gate", + "model.layers.21.self_attn.k_norm", + "model.layers.92.mlp.gate", + "model.layers.15.mlp.gate.e_score_correction_bias", + "model.layers.61.self_attn.k_proj.bias", + "model.layers.63.self_attn.q_norm", + "model.layers.73.self_attn.q_proj.bias", + "model.layers.18.self_attn.q_norm", + "model.layers.45.mlp.gate", + "model.layers.52.self_attn.v_proj.bias", + "model.layers.22.post_attention_layernorm", + "model.layers.85.self_attn.q_proj.bias", + "model.layers.3.self_attn.k_norm", + 
"model.layers.54.self_attn.v_proj.bias", + "model.layers.79.self_attn.v_proj.bias", + "model.layers.31.self_attn.q_proj.bias", + "model.layers.2.input_layernorm", + "model.layers.57.self_attn.q_norm", + "model.layers.65.self_attn.k_norm", + "model.layers.60.input_layernorm", + "model.layers.70.self_attn.v_proj.bias", + "model.layers.87.post_attention_layernorm", + "model.layers.83.post_attention_layernorm", + "model.layers.51.self_attn.k_proj.bias", + "model.layers.23.self_attn.k_norm", + "model.layers.49.self_attn.k_norm", + "model.layers.76.self_attn.k_proj.bias", + "model.layers.7.self_attn.q_norm", + "model.layers.54.mlp.gate", + "model.layers.63.post_attention_layernorm", + "model.layers.27.self_attn.k_proj.bias", + "model.layers.81.input_layernorm", + "model.layers.66.post_attention_layernorm", + "model.layers.84.self_attn.q_proj.bias", + "model.layers.36.self_attn.k_proj.bias", + "model.layers.30.self_attn.v_proj.bias", + "model.layers.48.self_attn.k_norm", + "model.layers.62.mlp.gate", + "model.layers.8.mlp.gate", + "model.layers.11.mlp.gate.e_score_correction_bias", + "model.layers.28.mlp.gate", + "model.layers.30.mlp.gate.e_score_correction_bias", + "model.layers.43.input_layernorm", + "model.layers.3.self_attn.q_proj.bias", + "model.layers.88.input_layernorm", + "model.layers.5.post_attention_layernorm", + "model.layers.35.self_attn.k_norm", + "model.layers.56.post_attention_layernorm", + "model.layers.30.mlp.gate", + "model.layers.67.self_attn.q_proj.bias", + "model.layers.58.post_attention_layernorm", + "model.layers.80.post_attention_layernorm", + "model.layers.88.self_attn.v_proj.bias", + "model.layers.90.self_attn.v_proj.bias", + "model.layers.2.self_attn.k_norm", + "model.layers.67.mlp.gate.e_score_correction_bias", + "model.layers.31.input_layernorm", + "model.layers.26.post_attention_layernorm", + "model.layers.81.self_attn.k_proj.bias", + "model.layers.51.self_attn.q_norm", + "model.layers.7.self_attn.k_proj.bias", + 
"model.layers.76.self_attn.q_proj.bias", + "model.layers.1.self_attn.k_norm", + "model.layers.34.mlp.gate.e_score_correction_bias", + "model.layers.80.self_attn.k_proj.bias", + "model.layers.0.self_attn.k_norm", + "model.layers.44.self_attn.q_norm", + "model.layers.29.input_layernorm", + "model.layers.77.self_attn.v_proj.bias", + "model.layers.73.mlp.gate", + "model.layers.31.self_attn.v_proj.bias", + "model.layers.46.self_attn.q_proj.bias", + "model.layers.62.self_attn.k_norm", + "model.layers.87.self_attn.k_proj.bias", + "model.layers.58.self_attn.k_norm", + "model.layers.66.mlp.gate.e_score_correction_bias", + "model.layers.32.mlp.gate.e_score_correction_bias", + "model.layers.73.self_attn.k_proj.bias", + "model.layers.85.mlp.gate.e_score_correction_bias", + "model.layers.23.mlp.gate", + "model.layers.72.self_attn.q_proj.bias", + "model.layers.25.mlp.gate", + "model.layers.43.mlp.gate.e_score_correction_bias", + "model.layers.50.mlp.gate.e_score_correction_bias", + "model.layers.6.mlp.gate.e_score_correction_bias", + "model.layers.14.mlp.gate", + "model.layers.50.self_attn.v_proj.bias", + "model.layers.33.self_attn.k_norm", + "model.layers.92.self_attn.q_proj.bias", + "model.layers.6.self_attn.k_proj.bias", + "model.layers.43.mlp.gate", + "model.layers.68.self_attn.q_proj.bias", + "model.layers.33.self_attn.v_proj.bias", + "model.layers.41.self_attn.k_norm", + "model.layers.32.self_attn.k_norm", + "model.layers.28.post_attention_layernorm", + "model.layers.61.self_attn.v_proj.bias", + "model.layers.16.post_attention_layernorm", + "model.layers.48.mlp.gate.e_score_correction_bias", + "model.layers.4.self_attn.v_proj.bias", + "model.layers.88.self_attn.k_norm", + "model.layers.68.self_attn.k_norm", + "model.layers.77.self_attn.q_proj.bias", + "model.layers.8.self_attn.v_proj.bias", + "model.layers.20.mlp.gate.e_score_correction_bias", + "model.layers.86.self_attn.k_norm", + "model.layers.36.self_attn.v_proj.bias", + "model.layers.71.input_layernorm", + 
"model.layers.72.mlp.gate", + "model.layers.24.self_attn.k_norm", + "model.layers.20.self_attn.q_norm", + "model.layers.62.post_attention_layernorm", + "model.layers.3.self_attn.v_proj.bias", + "model.layers.25.input_layernorm", + "model.layers.20.self_attn.v_proj.bias", + "model.layers.64.self_attn.v_proj.bias", + "model.layers.19.self_attn.k_proj.bias", + "model.layers.63.mlp.gate.e_score_correction_bias", + "model.layers.92.embed_tokens", + "model.layers.62.self_attn.q_proj.bias", + "model.layers.69.self_attn.q_norm", + "model.layers.9.mlp.gate", + "model.layers.62.mlp.gate.e_score_correction_bias", + "model.layers.35.self_attn.k_proj.bias", + "model.layers.1.self_attn.q_proj.bias", + "model.layers.40.self_attn.q_norm", + "model.layers.26.input_layernorm", + "model.layers.50.self_attn.k_proj.bias", + "model.layers.39.input_layernorm", + "model.layers.28.self_attn.k_proj.bias", + "model.layers.39.self_attn.q_proj.bias", + "model.layers.5.mlp.gate", + "model.layers.56.input_layernorm", + "model.layers.60.self_attn.k_norm", + "model.layers.76.self_attn.q_norm", + "lm_head", + "model.layers.69.self_attn.k_norm", + "model.layers.23.self_attn.q_proj.bias", + "model.layers.58.self_attn.q_proj.bias", + "model.norm", + "model.layers.53.self_attn.k_proj.bias", + "model.layers.73.self_attn.v_proj.bias", + "model.layers.33.self_attn.q_proj.bias", + "model.layers.64.input_layernorm", + "model.layers.15.mlp.gate", + "model.layers.55.self_attn.q_proj.bias", + "model.layers.55.self_attn.k_norm", + "model.layers.27.mlp.gate.e_score_correction_bias", + "model.layers.68.input_layernorm", + "model.layers.30.self_attn.q_norm", + "model.layers.82.post_attention_layernorm", + "model.layers.29.self_attn.q_proj.bias", + "model.layers.79.self_attn.k_proj.bias", + "model.layers.16.self_attn.k_proj.bias", + "model.layers.71.self_attn.k_norm", + "model.layers.16.self_attn.k_norm", + "model.layers.75.self_attn.k_proj.bias", + "model.layers.52.self_attn.q_norm", + 
"model.layers.87.self_attn.v_proj.bias", + "model.layers.23.self_attn.k_proj.bias", + "model.layers.24.post_attention_layernorm", + "model.layers.40.self_attn.q_proj.bias", + "model.layers.46.mlp.gate.e_score_correction_bias", + "model.layers.54.input_layernorm", + "model.layers.75.post_attention_layernorm", + "model.layers.72.self_attn.k_proj.bias", + "model.layers.82.self_attn.q_proj.bias", + "model.layers.75.mlp.gate.e_score_correction_bias", + "model.layers.27.self_attn.q_norm", + "model.layers.39.self_attn.q_norm", + "model.layers.45.self_attn.k_proj.bias", + "model.layers.90.self_attn.k_proj.bias", + "model.layers.65.self_attn.q_proj.bias", + "model.layers.5.self_attn.k_norm", + "model.layers.89.self_attn.q_proj.bias", + "model.layers.10.self_attn.k_proj.bias", + "model.layers.86.self_attn.v_proj.bias", + "model.layers.89.mlp.gate.e_score_correction_bias", + "model.layers.42.self_attn.k_norm", + "model.layers.57.self_attn.k_proj.bias", + "model.layers.68.post_attention_layernorm", + "model.layers.1.self_attn.v_proj.bias", + "model.layers.38.self_attn.k_proj.bias", + "model.layers.75.self_attn.v_proj.bias", + "model.layers.44.self_attn.q_proj.bias", + "model.layers.8.mlp.gate.e_score_correction_bias", + "model.layers.55.input_layernorm", + "model.layers.7.self_attn.v_proj.bias", + "model.layers.51.self_attn.k_norm", + "model.layers.19.mlp.gate", + "model.layers.12.self_attn.q_norm", + "model.layers.78.self_attn.k_norm", + "model.layers.61.self_attn.q_norm", + "model.layers.18.mlp.gate", + "model.layers.8.self_attn.q_norm", + "model.layers.7.self_attn.k_norm", + "model.layers.84.self_attn.q_norm", + "model.layers.44.self_attn.k_proj.bias", + "model.layers.38.self_attn.q_proj.bias", + "model.layers.37.mlp.gate.e_score_correction_bias", + "model.layers.34.mlp.gate", + "model.layers.92.eh_proj", + "model.layers.75.self_attn.q_proj.bias", + "model.layers.61.mlp.gate.e_score_correction_bias", + "model.layers.33.mlp.gate.e_score_correction_bias", + 
"model.layers.81.mlp.gate.e_score_correction_bias", + "model.layers.47.self_attn.k_proj.bias", + "model.layers.72.self_attn.q_norm", + "model.layers.62.self_attn.k_proj.bias", + "model.layers.33.self_attn.q_norm", + "model.layers.24.mlp.gate", + "model.layers.51.input_layernorm", + "model.layers.42.self_attn.k_proj.bias", + "model.layers.43.self_attn.k_norm", + "model.layers.46.self_attn.k_proj.bias", + "model.layers.66.input_layernorm", + "model.layers.31.mlp.gate.e_score_correction_bias", + "model.layers.77.post_attention_layernorm", + "model.layers.52.self_attn.k_norm", + "model.layers.4.mlp.gate", + "model.layers.51.post_attention_layernorm", + "model.layers.15.self_attn.k_norm", + "model.layers.60.self_attn.k_proj.bias", + "model.layers.6.self_attn.q_norm", + "model.layers.85.mlp.gate", + "model.layers.66.self_attn.k_norm", + "model.layers.22.self_attn.v_proj.bias", + "model.layers.36.self_attn.k_norm", + "model.layers.8.input_layernorm", + "model.layers.19.mlp.gate.e_score_correction_bias", + "model.layers.25.self_attn.k_proj.bias", + "model.layers.31.self_attn.q_norm", + "model.layers.16.mlp.gate.e_score_correction_bias", + "model.layers.57.self_attn.v_proj.bias", + "model.layers.35.mlp.gate", + "model.layers.75.input_layernorm", + "model.layers.2.self_attn.v_proj.bias", + "model.layers.9.self_attn.v_proj.bias", + "model.layers.80.self_attn.q_proj.bias", + "model.layers.19.self_attn.v_proj.bias", + "model.layers.4.post_attention_layernorm", + "model.layers.65.input_layernorm", + "model.layers.82.mlp.gate.e_score_correction_bias", + "model.layers.69.post_attention_layernorm", + "model.layers.21.self_attn.q_norm", + "model.layers.18.post_attention_layernorm", + "model.layers.81.self_attn.q_proj.bias", + "model.layers.77.input_layernorm", + "model.layers.17.self_attn.q_norm", + "model.layers.80.input_layernorm", + "model.layers.13.mlp.gate.e_score_correction_bias", + "model.layers.0.post_attention_layernorm", + "model.layers.19.post_attention_layernorm", + 
"model.layers.91.self_attn.v_proj.bias", + "model.layers.77.mlp.gate", + "model.layers.11.self_attn.q_norm", + "model.layers.92.hnorm", + "model.layers.11.self_attn.q_proj.bias", + "model.layers.47.self_attn.q_norm", + "model.layers.42.self_attn.v_proj.bias", + "model.layers.90.input_layernorm", + "model.layers.78.input_layernorm", + "model.layers.11.self_attn.v_proj.bias", + "model.layers.80.self_attn.q_norm", + "model.layers.83.input_layernorm", + "model.layers.43.self_attn.q_norm", + "model.layers.91.post_attention_layernorm", + "model.layers.50.mlp.gate", + "model.layers.48.self_attn.k_proj.bias", + "model.layers.70.mlp.gate.e_score_correction_bias", + "model.layers.14.self_attn.q_proj.bias", + "model.layers.31.self_attn.k_proj.bias", + "model.layers.47.self_attn.v_proj.bias", + "model.layers.12.self_attn.k_proj.bias", + "model.layers.12.mlp.gate", + "model.layers.34.self_attn.q_norm", + "model.layers.62.self_attn.v_proj.bias", + "model.layers.26.mlp.gate.e_score_correction_bias", + "model.layers.45.mlp.gate.e_score_correction_bias", + "model.layers.77.self_attn.q_norm", + "model.layers.47.self_attn.k_norm", + "model.layers.53.post_attention_layernorm", + "model.layers.7.post_attention_layernorm", + "model.layers.90.post_attention_layernorm", + "model.layers.40.mlp.gate.e_score_correction_bias", + "model.layers.63.input_layernorm", + "model.layers.52.mlp.gate.e_score_correction_bias", + "model.layers.92.input_layernorm", + "model.layers.44.self_attn.v_proj.bias", + "model.layers.46.mlp.gate", + "model.layers.18.self_attn.k_proj.bias", + "model.layers.62.input_layernorm", + "model.layers.24.self_attn.v_proj.bias", + "model.layers.40.post_attention_layernorm", + "model.layers.8.post_attention_layernorm", + "model.layers.82.mlp.gate", + "model.layers.17.post_attention_layernorm", + "model.layers.45.self_attn.v_proj.bias", + "model.layers.84.self_attn.k_proj.bias", + "model.layers.15.self_attn.k_proj.bias", + "model.layers.0.self_attn.q_proj.bias", + 
"model.layers.92.shared_head.norm", + "model.layers.51.self_attn.q_proj.bias", + "model.layers.22.mlp.gate", + "model.layers.4.self_attn.k_norm", + "model.layers.84.input_layernorm", + "model.layers.30.self_attn.k_proj.bias", + "model.layers.12.self_attn.v_proj.bias", + "model.layers.37.input_layernorm", + "model.layers.37.self_attn.q_norm", + "model.layers.45.self_attn.q_norm", + "model.layers.72.self_attn.v_proj.bias", + "model.layers.64.self_attn.k_norm", + "model.layers.43.self_attn.k_proj.bias", + "model.layers.38.mlp.gate.e_score_correction_bias", + "model.layers.79.input_layernorm", + "model.layers.48.mlp.gate", + "model.layers.52.self_attn.q_proj.bias", + "model.layers.46.self_attn.v_proj.bias", + "model.layers.81.mlp.gate", + "model.layers.71.self_attn.q_proj.bias", + "model.layers.50.self_attn.k_norm", + "model.layers.18.self_attn.v_proj.bias", + "model.layers.53.input_layernorm", + "model.layers.64.self_attn.q_proj.bias", + "model.layers.12.self_attn.k_norm", + "model.embed_tokens", + "model.layers.78.self_attn.k_proj.bias", + "model.layers.40.self_attn.k_norm", + "model.layers.11.input_layernorm", + "model.layers.22.input_layernorm", + "model.layers.39.mlp.gate", + "model.layers.30.self_attn.k_norm", + "model.layers.71.mlp.gate", + "model.layers.71.post_attention_layernorm", + "model.layers.78.self_attn.q_norm", + "model.layers.87.mlp.gate", + "model.layers.14.self_attn.q_norm", + "model.layers.42.post_attention_layernorm", + "model.layers.3.post_attention_layernorm", + "model.layers.92.self_attn.k_proj.bias", + "model.layers.3.mlp.gate", + "model.layers.89.mlp.gate", + "model.layers.86.self_attn.k_proj.bias", + "model.layers.87.self_attn.q_proj.bias", + "model.layers.63.self_attn.k_proj.bias", + "model.layers.87.input_layernorm", + "model.layers.10.self_attn.q_proj.bias", + "model.layers.81.post_attention_layernorm", + "model.layers.39.self_attn.v_proj.bias", + "model.layers.43.post_attention_layernorm", + "model.layers.76.mlp.gate", + 
"model.layers.28.self_attn.v_proj.bias", + "model.layers.57.self_attn.q_proj.bias", + "model.layers.21.mlp.gate.e_score_correction_bias", + "model.layers.75.self_attn.q_norm", + "model.layers.58.self_attn.k_proj.bias", + "model.layers.52.input_layernorm", + "model.layers.0.self_attn.k_proj.bias", + "model.layers.78.mlp.gate.e_score_correction_bias", + "model.layers.85.self_attn.k_norm", + "model.layers.42.self_attn.q_norm", + "model.layers.25.self_attn.v_proj.bias", + "model.layers.36.post_attention_layernorm", + "model.layers.4.self_attn.q_norm", + "model.layers.16.self_attn.q_norm", + "model.layers.41.self_attn.k_proj.bias", + "model.layers.5.self_attn.q_proj.bias", + "model.layers.28.self_attn.q_norm", + "model.layers.41.self_attn.q_proj.bias", + "model.layers.68.mlp.gate.e_score_correction_bias", + "model.layers.26.self_attn.k_proj.bias", + "model.layers.86.input_layernorm", + "model.layers.35.mlp.gate.e_score_correction_bias", + "model.layers.69.input_layernorm", + "model.layers.77.mlp.gate.e_score_correction_bias", + "model.layers.10.self_attn.q_norm", + "model.layers.32.post_attention_layernorm", + "model.layers.54.self_attn.q_norm", + "model.layers.45.post_attention_layernorm", + "model.layers.45.input_layernorm", + "model.layers.15.post_attention_layernorm", + "model.layers.64.post_attention_layernorm", + "model.layers.15.self_attn.v_proj.bias", + "model.layers.24.self_attn.k_proj.bias", + "model.layers.64.self_attn.k_proj.bias", + "model.layers.14.post_attention_layernorm", + "model.layers.40.mlp.gate", + "model.layers.50.input_layernorm", + "model.layers.21.self_attn.v_proj.bias", + "model.layers.66.self_attn.q_proj.bias", + "model.layers.78.mlp.gate", + "model.layers.2.self_attn.q_proj.bias", + "model.layers.12.self_attn.q_proj.bias", + "model.layers.7.mlp.gate", + "model.layers.35.post_attention_layernorm", + "model.layers.52.post_attention_layernorm", + "model.layers.30.post_attention_layernorm", + "model.layers.59.input_layernorm", + 
"model.layers.86.post_attention_layernorm", + "model.layers.0.self_attn.v_proj.bias", + "model.layers.24.mlp.gate.e_score_correction_bias", + "model.layers.34.self_attn.k_norm", + "model.layers.4.self_attn.k_proj.bias", + "model.layers.74.self_attn.q_proj.bias", + "model.layers.78.self_attn.v_proj.bias", + "model.layers.49.self_attn.q_proj.bias", + "model.layers.53.mlp.gate.e_score_correction_bias", + "model.layers.60.self_attn.v_proj.bias", + "model.layers.59.mlp.gate", + "model.layers.61.mlp.gate", + "model.layers.26.self_attn.q_norm", + "model.layers.1.input_layernorm", + "model.layers.33.mlp.gate", + "model.layers.91.mlp.gate", + "model.layers.26.self_attn.q_proj.bias", + "model.layers.83.mlp.gate", + "model.layers.12.mlp.gate.e_score_correction_bias", + "model.layers.36.self_attn.q_norm", + "model.layers.91.mlp.gate.e_score_correction_bias", + "model.layers.25.self_attn.q_norm", + "model.layers.91.self_attn.k_norm", + "model.layers.20.self_attn.k_norm", + "model.layers.8.self_attn.k_proj.bias", + "model.layers.29.self_attn.v_proj.bias", + "model.layers.82.self_attn.k_proj.bias", + "model.layers.89.post_attention_layernorm", + "model.layers.29.self_attn.k_norm", + "model.layers.88.self_attn.q_norm", + "model.layers.48.self_attn.q_proj.bias", + "model.layers.22.self_attn.k_norm", + "model.layers.27.self_attn.q_proj.bias", + "model.layers.23.mlp.gate.e_score_correction_bias", + "model.layers.1.post_attention_layernorm", + "model.layers.29.post_attention_layernorm", + "model.layers.58.mlp.gate", + "model.layers.27.input_layernorm", + "model.layers.66.self_attn.k_proj.bias", + "model.layers.87.mlp.gate.e_score_correction_bias", + "model.layers.22.self_attn.q_norm", + "model.layers.4.mlp.gate.e_score_correction_bias", + "model.layers.51.mlp.gate", + "model.layers.90.mlp.gate.e_score_correction_bias", + "model.layers.3.self_attn.q_norm", + "model.layers.33.input_layernorm", + "model.layers.91.self_attn.k_proj.bias", + "model.layers.8.self_attn.q_proj.bias", + 
"model.layers.12.post_attention_layernorm", + "model.layers.3.mlp.gate.e_score_correction_bias", + "model.layers.69.mlp.gate.e_score_correction_bias", + "model.layers.17.self_attn.k_proj.bias", + "model.layers.82.self_attn.k_norm", + "model.layers.10.post_attention_layernorm", + "model.layers.84.mlp.gate", + "model.layers.6.input_layernorm", + "model.layers.70.mlp.gate", + "model.layers.33.post_attention_layernorm", + "model.layers.31.self_attn.k_norm", + "model.layers.88.self_attn.q_proj.bias", + "model.layers.80.self_attn.k_norm", + "model.layers.36.mlp.gate.e_score_correction_bias", + "model.layers.56.self_attn.v_proj.bias", + "model.layers.1.self_attn.k_proj.bias", + "model.layers.44.self_attn.k_norm", + "model.layers.60.mlp.gate.e_score_correction_bias", + "model.layers.32.self_attn.k_proj.bias", + "model.layers.69.self_attn.k_proj.bias", + "model.layers.4.input_layernorm", + "model.layers.15.self_attn.q_norm", + "model.layers.79.self_attn.k_norm", + "model.layers.4.self_attn.q_proj.bias", + "model.layers.51.mlp.gate.e_score_correction_bias", + "model.layers.57.self_attn.k_norm", + "model.layers.90.self_attn.k_norm", + "model.layers.27.self_attn.k_norm", + "model.layers.50.post_attention_layernorm", + "model.layers.21.self_attn.q_proj.bias", + "model.layers.10.input_layernorm", + "model.layers.64.self_attn.q_norm", + "model.layers.67.self_attn.k_proj.bias", + "model.layers.85.self_attn.v_proj.bias", + "model.layers.14.mlp.gate.e_score_correction_bias", + "model.layers.32.mlp.gate", + "model.layers.67.self_attn.v_proj.bias", + "model.layers.26.self_attn.k_norm", + "model.layers.19.self_attn.q_norm", + "model.layers.22.mlp.gate.e_score_correction_bias", + "model.layers.68.self_attn.q_norm", + "model.layers.86.mlp.gate.e_score_correction_bias", + "model.layers.20.post_attention_layernorm", + "model.layers.21.post_attention_layernorm", + "model.layers.49.self_attn.v_proj.bias", + "model.layers.38.mlp.gate", + "model.layers.82.self_attn.v_proj.bias", + 
"model.layers.42.mlp.gate", + "model.layers.21.input_layernorm", + "model.layers.22.self_attn.k_proj.bias", + "model.layers.54.self_attn.q_proj.bias", + "model.layers.76.post_attention_layernorm", + "model.layers.67.input_layernorm", + "model.layers.65.self_attn.v_proj.bias", + "model.layers.67.self_attn.q_norm", + "model.layers.79.self_attn.q_norm", + "model.layers.47.input_layernorm", + "model.layers.79.mlp.gate.e_score_correction_bias", + "model.layers.76.self_attn.k_norm", + "model.layers.60.mlp.gate", + "model.layers.20.self_attn.q_proj.bias", + "model.layers.11.post_attention_layernorm", + "model.layers.24.self_attn.q_norm", + "model.layers.53.self_attn.k_norm", + "model.layers.53.self_attn.q_proj.bias", + "model.layers.75.self_attn.k_norm", + "model.layers.28.self_attn.q_proj.bias", + "model.layers.65.self_attn.q_norm", + "model.layers.39.self_attn.k_proj.bias", + "model.layers.85.input_layernorm", + "model.layers.17.self_attn.q_proj.bias", + "model.layers.65.post_attention_layernorm", + "model.layers.68.mlp.gate", + "model.layers.13.self_attn.q_norm", + "model.layers.81.self_attn.v_proj.bias", + "model.layers.58.self_attn.q_norm", + "model.layers.34.input_layernorm", + "model.layers.25.self_attn.q_proj.bias", + "model.layers.77.self_attn.k_proj.bias", + "model.layers.39.mlp.gate.e_score_correction_bias", + "model.layers.0.input_layernorm", + "model.layers.76.self_attn.v_proj.bias", + "model.layers.6.self_attn.k_norm", + "model.layers.74.self_attn.k_proj.bias", + "model.layers.92.self_attn.k_norm", + "model.layers.37.self_attn.k_proj.bias", + "model.layers.18.self_attn.k_norm", + "model.layers.48.self_attn.q_norm", + "model.layers.84.self_attn.v_proj.bias", + "model.layers.47.mlp.gate.e_score_correction_bias", + "model.layers.49.self_attn.q_norm", + "model.layers.51.self_attn.v_proj.bias", + "model.layers.61.input_layernorm", + "model.layers.28.self_attn.k_norm", + "model.layers.32.self_attn.v_proj.bias", + "model.layers.55.self_attn.q_norm", + 
"model.layers.55.self_attn.k_proj.bias", + "model.layers.47.post_attention_layernorm", + "model.layers.69.self_attn.q_proj.bias", + "model.layers.28.input_layernorm", + "model.layers.40.self_attn.v_proj.bias", + "model.layers.19.input_layernorm", + "model.layers.83.self_attn.q_proj.bias", + "model.layers.66.self_attn.v_proj.bias", + "model.layers.59.mlp.gate.e_score_correction_bias", + "model.layers.23.self_attn.v_proj.bias", + "model.layers.0.self_attn.q_norm", + "model.layers.5.mlp.gate.e_score_correction_bias", + "model.layers.37.self_attn.v_proj.bias", + "model.layers.2.post_attention_layernorm", + "model.layers.5.self_attn.v_proj.bias", + "model.layers.34.self_attn.k_proj.bias", + "model.layers.38.self_attn.v_proj.bias", + "model.layers.81.self_attn.k_norm", + "model.layers.32.input_layernorm", + "model.layers.10.self_attn.k_norm", + "model.layers.54.self_attn.k_norm", + "model.layers.70.input_layernorm", + "model.layers.41.self_attn.v_proj.bias", + "model.layers.74.post_attention_layernorm", + "model.layers.35.input_layernorm", + "model.layers.7.mlp.gate.e_score_correction_bias", + "model.layers.6.post_attention_layernorm", + "model.layers.86.mlp.gate", + "model.layers.20.mlp.gate", + "model.layers.31.mlp.gate", + "model.layers.2.self_attn.q_norm", + "model.layers.23.self_attn.q_norm", + "model.layers.6.self_attn.q_proj.bias", + "model.layers.83.self_attn.k_norm", + "model.layers.38.input_layernorm", + "model.layers.60.self_attn.q_norm", + "model.layers.91.self_attn.q_norm", + "model.layers.44.input_layernorm", + "model.layers.67.post_attention_layernorm", + "model.layers.27.self_attn.v_proj.bias", + "model.layers.15.input_layernorm", + "model.layers.26.self_attn.v_proj.bias", + "model.layers.44.post_attention_layernorm", + "model.layers.46.self_attn.q_norm", + "model.layers.58.self_attn.v_proj.bias", + "model.layers.67.self_attn.k_norm", + "model.layers.38.self_attn.k_norm", + "model.layers.56.mlp.gate.e_score_correction_bias", + 
"model.layers.73.self_attn.k_norm", + "model.layers.80.mlp.gate.e_score_correction_bias", + "model.layers.37.self_attn.q_proj.bias", + "model.layers.17.mlp.gate", + "model.layers.19.self_attn.k_norm", + "model.layers.53.mlp.gate", + "model.layers.21.self_attn.k_proj.bias", + "model.layers.56.self_attn.q_norm", + "model.layers.59.self_attn.v_proj.bias", + "model.layers.64.mlp.gate.e_score_correction_bias", + "model.layers.86.self_attn.q_proj.bias", + "model.layers.46.input_layernorm", + "model.layers.6.mlp.gate", + "model.layers.40.self_attn.k_proj.bias", + "model.layers.60.self_attn.q_proj.bias", + "model.layers.6.self_attn.v_proj.bias", + "model.layers.47.mlp.gate", + "model.layers.32.self_attn.q_proj.bias", + "model.layers.17.mlp.gate.e_score_correction_bias", + "model.layers.29.self_attn.k_proj.bias", + "model.layers.44.mlp.gate.e_score_correction_bias", + "model.layers.57.mlp.gate.e_score_correction_bias", + "model.layers.87.self_attn.q_norm", + "model.layers.71.self_attn.q_norm", + "model.layers.52.self_attn.k_proj.bias", + "model.layers.88.mlp.gate.e_score_correction_bias", + "model.layers.68.self_attn.k_proj.bias", + "model.layers.16.self_attn.q_proj.bias", + "model.layers.48.self_attn.v_proj.bias", + "model.layers.74.self_attn.q_norm", + "model.layers.34.self_attn.q_proj.bias", + "model.layers.1.self_attn.q_norm", + "model.layers.63.mlp.gate", + "model.layers.92.enorm", + "model.layers.14.self_attn.v_proj.bias", + "model.layers.54.post_attention_layernorm", + "model.layers.41.self_attn.q_norm", + "model.layers.37.post_attention_layernorm", + "model.layers.61.self_attn.q_proj.bias", + "model.layers.91.input_layernorm", + "model.layers.11.self_attn.k_norm", + "model.layers.43.self_attn.q_proj.bias", + "model.layers.18.mlp.gate.e_score_correction_bias", + "model.layers.59.post_attention_layernorm", + "model.layers.9.self_attn.q_norm", + "model.layers.74.self_attn.k_norm", + "model.layers.43.self_attn.v_proj.bias", + "model.layers.49.self_attn.k_proj.bias", + 
"model.layers.56.self_attn.k_proj.bias", + "model.layers.14.self_attn.k_proj.bias", + "model.layers.65.mlp.gate", + "model.layers.56.self_attn.q_proj.bias", + "model.layers.24.self_attn.q_proj.bias", + "model.layers.71.self_attn.v_proj.bias", + "model.layers.54.mlp.gate.e_score_correction_bias", + "model.layers.39.post_attention_layernorm", + "model.layers.91.self_attn.q_proj.bias", + "model.layers.92.mlp.gate.e_score_correction_bias", + "model.layers.46.post_attention_layernorm", + "model.layers.92.self_attn.v_proj.bias", + "model.layers.63.self_attn.v_proj.bias", + "model.layers.25.post_attention_layernorm", + "model.layers.45.self_attn.q_proj.bias", + "model.layers.38.self_attn.q_norm", + "model.layers.68.self_attn.v_proj.bias", + "model.layers.69.mlp.gate", + "model.layers.84.self_attn.k_norm", + "model.layers.19.self_attn.q_proj.bias", + "model.layers.38.post_attention_layernorm", + "model.layers.44.mlp.gate", + "model.layers.70.post_attention_layernorm", + "model.layers.58.mlp.gate.e_score_correction_bias", + "model.layers.28.mlp.gate.e_score_correction_bias", + "model.layers.48.post_attention_layernorm", + "model.layers.36.self_attn.q_proj.bias", + "model.layers.66.self_attn.q_norm", + "model.layers.70.self_attn.k_proj.bias", + "model.layers.57.input_layernorm", + "model.layers.42.self_attn.q_proj.bias", + "model.layers.26.mlp.gate", + "model.layers.74.self_attn.v_proj.bias", + "model.layers.59.self_attn.k_proj.bias", + "model.layers.88.mlp.gate", + "model.layers.14.self_attn.k_norm", + "model.layers.88.self_attn.k_proj.bias", + "model.layers.35.self_attn.q_proj.bias", + "model.layers.65.self_attn.k_proj.bias", + "model.layers.18.self_attn.q_proj.bias", + "model.layers.30.self_attn.q_proj.bias", + "model.layers.29.self_attn.q_norm", + "model.layers.78.post_attention_layernorm", + "model.layers.79.mlp.gate", + "model.layers.27.post_attention_layernorm", + "model.layers.80.self_attn.v_proj.bias", + "model.layers.16.mlp.gate", + 
"model.layers.10.self_attn.v_proj.bias", + "model.layers.13.self_attn.v_proj.bias", + "model.layers.70.self_attn.q_norm", + "model.layers.73.mlp.gate.e_score_correction_bias", + "model.layers.41.post_attention_layernorm", + "model.layers.39.self_attn.k_norm", + "model.layers.10.mlp.gate", + "model.layers.36.mlp.gate", + "model.layers.92.post_attention_layernorm", + "model.layers.64.mlp.gate", + "model.layers.40.input_layernorm", + "model.layers.77.self_attn.k_norm", + "model.layers.31.post_attention_layernorm", + "model.layers.56.mlp.gate", + "model.layers.16.self_attn.v_proj.bias", + "model.layers.9.self_attn.q_proj.bias", + "model.layers.13.mlp.gate", + "model.layers.17.self_attn.k_norm", + "model.layers.22.self_attn.q_proj.bias", + "model.layers.49.mlp.gate.e_score_correction_bias", + "model.layers.9.self_attn.k_proj.bias", + "model.layers.37.mlp.gate", + "model.layers.72.mlp.gate.e_score_correction_bias", + "model.layers.90.self_attn.q_norm", + "model.layers.79.self_attn.q_proj.bias", + "model.layers.75.mlp.gate", + "model.layers.74.mlp.gate.e_score_correction_bias", + "model.layers.89.self_attn.v_proj.bias", + "model.layers.59.self_attn.k_norm", + "model.layers.76.input_layernorm", + "model.layers.66.mlp.gate", + "model.layers.55.post_attention_layernorm", + "model.layers.24.input_layernorm", + "model.layers.57.post_attention_layernorm", + "model.layers.23.input_layernorm", + "model.layers.67.mlp.gate", + "model.layers.13.self_attn.k_proj.bias", + "model.layers.69.self_attn.v_proj.bias", + "model.layers.85.post_attention_layernorm", + "model.layers.13.self_attn.q_proj.bias", + "model.layers.87.self_attn.k_norm", + "model.layers.89.self_attn.k_norm", + "model.layers.54.self_attn.k_proj.bias", + "model.layers.49.input_layernorm", + "model.layers.78.self_attn.q_proj.bias", + "model.layers.81.self_attn.q_norm", + "model.layers.41.input_layernorm", + "model.layers.90.mlp.gate", + "model.layers.61.self_attn.k_norm", + "model.layers.20.input_layernorm" + ], + 
"quant_method": "compressed-tensors", + "quantization_status": "compressed" + } +} diff --git a/generation_config.json b/generation_config.json new file mode 100644 index 0000000000000000000000000000000000000000..55942563772385555a04b7be7ce33240c1c2d15e --- /dev/null +++ b/generation_config.json @@ -0,0 +1,11 @@ +{ + "_from_model_config": true, + "eos_token_id": [ + 151329, + 151336, + 151338 + ], + "temperature": 1.0, + "pad_token_id": 151329, + "transformers_version": "4.54.0" +} diff --git a/model-00001-of-00092.safetensors b/model-00001-of-00092.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..eef362e533b32930bbb8d08044d32651362f0085 --- /dev/null +++ b/model-00001-of-00092.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b36a87481f296d0aa98385f964b7e39ba8b6b3de8d9233484a514b35062dbfec +size 1877199832 diff --git a/model-00002-of-00092.safetensors b/model-00002-of-00092.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7d55fbe645f73bc7608d21922c8d275b2e4c455c --- /dev/null +++ b/model-00002-of-00092.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e4377353c9df8c7180bf0d4d876d0a567953a42388771ef110ae144392769555 +size 325307176 diff --git a/model-00003-of-00092.safetensors b/model-00003-of-00092.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..1a520a23fba5eb97e4511133027d8b3c0c2383cb --- /dev/null +++ b/model-00003-of-00092.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:894d603e1bace165a158dfed52240a079b9261bfb5f727248c0387a6f7e3393f +size 325307176 diff --git a/model-00004-of-00092.safetensors b/model-00004-of-00092.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..9ced60dc38069a7ebe064e489ece8c4fffdc2dab --- /dev/null +++ b/model-00004-of-00092.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:1cd3fbef0cdd05105dfdd460578e67127b80dd79d151e1595ea0e156548e7e96 +size 3941945016 diff --git a/model-00005-of-00092.safetensors b/model-00005-of-00092.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7e67f14b903088457c2d8aba709d981f2d2e232e --- /dev/null +++ b/model-00005-of-00092.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:52cf9b585c448ef051051449f0298fbcbc564b0cd07477a6f81877105600fbac +size 3941945016 diff --git a/model-00006-of-00092.safetensors b/model-00006-of-00092.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..0f272d206a902c6091dac4417b5176577dab994d --- /dev/null +++ b/model-00006-of-00092.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e42ba13d58a14833a5663ea6308de626e7ed2fce0112137a02c2aafa3618a17 +size 3941945016 diff --git a/model-00007-of-00092.safetensors b/model-00007-of-00092.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..3b54775853a1e94cd34f299ac855c4be2ed712e8 --- /dev/null +++ b/model-00007-of-00092.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e18797a56cafdaa6af79ed015aeea3b0aaf64f81f502fe8e86b3350970cd7b91 +size 3941945016 diff --git a/model-00008-of-00092.safetensors b/model-00008-of-00092.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..14788b8aeabab277a400b54bfa5dc81cd99f56f3 --- /dev/null +++ b/model-00008-of-00092.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e9f10b8d1ca2a14385fc68c0e3a3afa3c92e7257b97f4b65f541e02a99ceee2 +size 3941945016 diff --git a/model-00009-of-00092.safetensors b/model-00009-of-00092.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..583d823b8d839570bcd7041852bc3a30c26b6791 --- /dev/null +++ b/model-00009-of-00092.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:7641b05d5a04c9de73e2e2ed3c644c7c8359b5049f219b17c6b50df597cd41b8 +size 3941945016 diff --git a/model-00010-of-00092.safetensors b/model-00010-of-00092.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5625e80fd94575acacbc952944a347daf15bc80a --- /dev/null +++ b/model-00010-of-00092.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b11e1b5061ad41b414303c354edf6f9eb1306f9766fff524a4042f37843dd7ab +size 3941945016 diff --git a/model-00011-of-00092.safetensors b/model-00011-of-00092.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..db103deb6609efe716c53fb97628ba9df402758d --- /dev/null +++ b/model-00011-of-00092.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a0ff0e88b6ee8e4a063826b874ddcd2a8ac6554656819163d5b61aa36831ccb2 +size 3941946000 diff --git a/model-00012-of-00092.safetensors b/model-00012-of-00092.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..9a712d9c99dd3fc373b2bb1e8bc551c29bf6a1fc --- /dev/null +++ b/model-00012-of-00092.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6466a2807bf05f0ad9692594253f616562b34a89ab4d6996defa21835c447647 +size 3941946000 diff --git a/model-00013-of-00092.safetensors b/model-00013-of-00092.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..3d3f660df54da9460a7f2c5f218a400ea3738d17 --- /dev/null +++ b/model-00013-of-00092.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:75ddfa9e346c02cf9aff2067f0110ba70e59cfc475afdee6e900474d9b73f99e +size 3941946000 diff --git a/model-00014-of-00092.safetensors b/model-00014-of-00092.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6d9220876ec9bc59eec7c5717c2e2a251df1f850 --- /dev/null +++ b/model-00014-of-00092.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:9c7dca430e5679422b738125a160d5d484ba55b32db28e2887f85a6cfbcf6b7a +size 3941946000 diff --git a/model-00015-of-00092.safetensors b/model-00015-of-00092.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..90b7d1e2ed81867ca40bf33eb63ba8fcdb25af1a --- /dev/null +++ b/model-00015-of-00092.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:249f98f6d42b67d699c2d244b5df000796e4432bd843f26ab39640597e49686e +size 3941946000 diff --git a/model-00016-of-00092.safetensors b/model-00016-of-00092.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a6b662b48ef5c3f6f64b72f251dbebbc8d6e2e67 --- /dev/null +++ b/model-00016-of-00092.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b66acc87692b8d8c794ff8fda0e0a2217ef7c9306daa5a90e97b77bdeac24b9c +size 3941946000 diff --git a/model-00017-of-00092.safetensors b/model-00017-of-00092.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..dcbec98bf209efeba4a545c8c4231ef2d087488d --- /dev/null +++ b/model-00017-of-00092.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:361fa81c2ff26252d66f2938de1f0ff91046dffda8a5e85afe2550498e00df01 +size 3941946000 diff --git a/model-00018-of-00092.safetensors b/model-00018-of-00092.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7ce031126daf4009f6b0f044306bac7a4fcaf844 --- /dev/null +++ b/model-00018-of-00092.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d5cf1c834832cae1a0a6800e87621091b57dc6641b57ebc8e75b2e99ab29f9e7 +size 3941946000 diff --git a/model-00019-of-00092.safetensors b/model-00019-of-00092.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f37a91370e0fe93a46e6bd345c971363e0de1baf --- /dev/null +++ b/model-00019-of-00092.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:7fd9d4ea2442838e9911e506233df72589841f81f849b7813e40c770e46ffb37 +size 3941946000 diff --git a/model-00020-of-00092.safetensors b/model-00020-of-00092.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..ae7068a02a311bd8ffd7fae04d1f36f2e0be164c --- /dev/null +++ b/model-00020-of-00092.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:805da56848f53fe8ba7b1d4766041176b07050bb2d06636354179420a3ef7a53 +size 3941946000 diff --git a/model-00021-of-00092.safetensors b/model-00021-of-00092.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..4c26079064a6e0e8e4b4ed1a0299e8420e8d5d29 --- /dev/null +++ b/model-00021-of-00092.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e70481fdbbb4b013e248a3978635db8149391cba0977b0af00f431bdf368a78b +size 3941946000 diff --git a/model-00022-of-00092.safetensors b/model-00022-of-00092.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..9c584190e218a5a6877b8b51782929681b5f085e --- /dev/null +++ b/model-00022-of-00092.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:522a46ea7d953e8bac1a7ef71ef87d08559cce9181600f59363b4a03a37978ba +size 3941946000 diff --git a/model-00023-of-00092.safetensors b/model-00023-of-00092.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..dc810bc8267a36fb06371654cf4d055adb7dae2a --- /dev/null +++ b/model-00023-of-00092.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4828ab751880a84b595764ad30da807ae4bfc7d6cd5060a467a5d4ee7c0472f9 +size 3941946000 diff --git a/model-00024-of-00092.safetensors b/model-00024-of-00092.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f7536210e2e75896a3c7c9883939bc57b9327e01 --- /dev/null +++ b/model-00024-of-00092.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:dd37f2bd39696f2879e47ee28775f25cb316189f31487c4820ec758ed3eb07e9 +size 3941946000 diff --git a/model-00025-of-00092.safetensors b/model-00025-of-00092.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..9869108a62c79e1bfa4b01738ec17c2814760862 --- /dev/null +++ b/model-00025-of-00092.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:499cccb499dfe2a7c38413373b9ef4f7aeafcc3adb5273c993b51ecdf66a1af4 +size 3941946000 diff --git a/model-00026-of-00092.safetensors b/model-00026-of-00092.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c36c81de5ceb4cd68616c6d4a2dc834332d25382 --- /dev/null +++ b/model-00026-of-00092.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f74964374efe4e3ebbe44e6c664cfd5e69315ef16479c4fb69ec21494406647f +size 3941946000 diff --git a/model-00027-of-00092.safetensors b/model-00027-of-00092.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7538bad9a24f7ecdb6c2bf50fdb8fb55a5411d9e --- /dev/null +++ b/model-00027-of-00092.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f386ccd96a1e9269912c11da13474929ef51a642451017cf71df0403183e3d46 +size 3941946000 diff --git a/model-00028-of-00092.safetensors b/model-00028-of-00092.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..47b5c4395e90bdc3bfca65b0426e42c419665266 --- /dev/null +++ b/model-00028-of-00092.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e9607d17b25225d77768fe976e412ac22e58b06ea7e5fedb41c0fb1e7c024aa3 +size 3941946000 diff --git a/model-00029-of-00092.safetensors b/model-00029-of-00092.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..ade71e46e55a0a07e5c779c1033d5b23d0aca560 --- /dev/null +++ b/model-00029-of-00092.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:90818dcdcef479199d3884e549597ca85eb1459fffb8d3ca1490df655062749e +size 3941946000 diff --git a/model-00030-of-00092.safetensors b/model-00030-of-00092.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d53b3951f701cf9faca6d364eb2071bcda593265 --- /dev/null +++ b/model-00030-of-00092.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f5c95e0c676d2e61ca2c2a64a1f93fec730b9e72595d62f341ab69669f4afe6 +size 3941946000 diff --git a/model-00031-of-00092.safetensors b/model-00031-of-00092.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..75192b3e8191f540d6ac328d4b892f812d394201 --- /dev/null +++ b/model-00031-of-00092.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a7262032f0ae419b7281c7fe00cdb32da11d1851e25552a0c72426131a195f6a +size 3941946000 diff --git a/model-00032-of-00092.safetensors b/model-00032-of-00092.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f00a028b94f4c36db1efbd8fb34ad53657de6032 --- /dev/null +++ b/model-00032-of-00092.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d599db91bc26fc7f51e6313ad71eef3e17d9306c70384520caab9a0f3e69d8d3 +size 3941946000 diff --git a/model-00033-of-00092.safetensors b/model-00033-of-00092.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..9f79aaa4cf6250765ca22914e98b355be3b347ab --- /dev/null +++ b/model-00033-of-00092.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ce02e0c5758d470bb953091aa074414532bbf094ff987c094731ed72de1d178 +size 3941946000 diff --git a/model-00034-of-00092.safetensors b/model-00034-of-00092.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..cd497c959da5f6c0bebb59c6a6cf32789f6496fc --- /dev/null +++ b/model-00034-of-00092.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:d26dbb8145811b8312bd1326e99534957c0cb8f14749b468afb526493c54fd4f +size 3941946000 diff --git a/model-00035-of-00092.safetensors b/model-00035-of-00092.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..91e0f64487b5ce2f0ac5182c59c9abaa775955e4 --- /dev/null +++ b/model-00035-of-00092.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2b95a853acc68338bdc9a25b8a06e95ae9eebe85c95739a6225e81e93d837dd +size 3941946000 diff --git a/model-00036-of-00092.safetensors b/model-00036-of-00092.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c204754b52237f215a2613ca9287eaf6db874644 --- /dev/null +++ b/model-00036-of-00092.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ea306c5fb06b73cc99ca0c1a0243047c78c5637d49908d98989fc80adef7623 +size 3941946000 diff --git a/model-00037-of-00092.safetensors b/model-00037-of-00092.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..975ce023899126031190da13a215d9112eacb06b --- /dev/null +++ b/model-00037-of-00092.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d172e2be799fb9207cfcd35790d5c827ae65cd631432c479b395a4da52c0d27 +size 3941946000 diff --git a/model-00038-of-00092.safetensors b/model-00038-of-00092.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..046435caafe51a3731a1abae53295842037b44d1 --- /dev/null +++ b/model-00038-of-00092.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97a20ab8c68afaaf94307353b8115d39be316c2aa1f71433d7cb134a2c598b85 +size 3941946000 diff --git a/model-00039-of-00092.safetensors b/model-00039-of-00092.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..53134b127ae13cc8f03dde1474950819aadaf10e --- /dev/null +++ b/model-00039-of-00092.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:8220c62ba76eaa513af60b1cab88303e7d2dda98af483cb603279e2ecf2474d0 +size 3941946000 diff --git a/model-00040-of-00092.safetensors b/model-00040-of-00092.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..9840abe05e5b5388455c3f173d9031c2cf3c1b32 --- /dev/null +++ b/model-00040-of-00092.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d977ba19ca442fe854b40ecdf24587241d36f6aa98828bc33e2d1415959b7594 +size 3941946000 diff --git a/model-00041-of-00092.safetensors b/model-00041-of-00092.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a766971186b9224cac0cb521fd8af7ab17caaa85 --- /dev/null +++ b/model-00041-of-00092.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b3a0fb8ea2b84f942e0de29c7a815d03b984758c008c019839578a37dce2c011 +size 3941946000 diff --git a/model-00042-of-00092.safetensors b/model-00042-of-00092.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d367ccdbede8478e9759a8424765aff0165be18a --- /dev/null +++ b/model-00042-of-00092.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b5982626470e66a5e3675bf24409bcc6044dafcb9f8ed055b9232252547cee3 +size 3941946000 diff --git a/model-00043-of-00092.safetensors b/model-00043-of-00092.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..02198e10ba7af68ac6ef1e4823ba82f92c148a89 --- /dev/null +++ b/model-00043-of-00092.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:37ec7e24ee7307a7beb1a186fd2f3505bc3deb955748990acbb0fea2f2cf82fd +size 3941946000 diff --git a/model-00044-of-00092.safetensors b/model-00044-of-00092.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..062e8f482e738a1570f5dee7484deee22251a0c3 --- /dev/null +++ b/model-00044-of-00092.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:eec5e6b73a6c0df1f1575154a3e3ed7666adf33803267c30faae7550faa33b68 +size 3941946000 diff --git a/model-00045-of-00092.safetensors b/model-00045-of-00092.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e46b5bd75a77f0f08ba438d9066721768a7e2089 --- /dev/null +++ b/model-00045-of-00092.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8dcd5b45b868f6993d03f3b5664f031937ecbb08d5a9a38b3daf72aab839f361 +size 3941946000 diff --git a/model-00046-of-00092.safetensors b/model-00046-of-00092.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e1006cea1a552625019cd625446e07e860f45e46 --- /dev/null +++ b/model-00046-of-00092.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:32fe9214b2e51fc57c6bc180a2f7c90ab949135b8b52e9f926e6abdff6b44e8f +size 3941946000 diff --git a/model-00047-of-00092.safetensors b/model-00047-of-00092.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6499d58ae0c98dad7ae869a7077abfb4537ac92a --- /dev/null +++ b/model-00047-of-00092.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:07957a95e73bc5c357b31e681b086413417fef3db448596b83a50369e67ca6b2 +size 3941946000 diff --git a/model-00048-of-00092.safetensors b/model-00048-of-00092.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..27b70720d23867788abfe15e3fc36b9697021e75 --- /dev/null +++ b/model-00048-of-00092.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c57f1f78fd768a7956c373bcf5a41616e8d01c5358dc8bad51a6477b85a4ec85 +size 3941946000 diff --git a/model-00049-of-00092.safetensors b/model-00049-of-00092.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..76adf7543484a2db4151eeee9081f67b2fd326ee --- /dev/null +++ b/model-00049-of-00092.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:86c27727d56f395d7348a0b202d454d40661d1dd1125eebbf37eab1d09f409da +size 3941946000 diff --git a/model-00050-of-00092.safetensors b/model-00050-of-00092.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..cf6bc4219363711581895006a329eb9b3763370a --- /dev/null +++ b/model-00050-of-00092.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:687cb273bfeff95fd54f89dbde8cf5a4d8245454ccbab89f09835eb57e82ac61 +size 3941946000 diff --git a/model-00051-of-00092.safetensors b/model-00051-of-00092.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..2219eca3232790f1624cf14c1dad896327412da7 --- /dev/null +++ b/model-00051-of-00092.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3a7a42e6a6f8fa0eb882ca3161c50f7692cac44dbf1e523d8e93152df634a95 +size 3941946000 diff --git a/model-00052-of-00092.safetensors b/model-00052-of-00092.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b2e366fc4fdd3d41a74f1af71d7bee870e118772 --- /dev/null +++ b/model-00052-of-00092.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:23906dc240eee83293d676f597efabeb73b9b2be898bda70603fbd390f9220bf +size 3941946000 diff --git a/model-00053-of-00092.safetensors b/model-00053-of-00092.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e3a393f3474220ac09ad0317047c55a47e2d447a --- /dev/null +++ b/model-00053-of-00092.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be920cf049b968c844e7a6e0266218eaee1cd8bc612cf4d9972629c04add882a +size 3941946000 diff --git a/model-00054-of-00092.safetensors b/model-00054-of-00092.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..060691c43acf4c4f35e24af5f31079d459e54fd4 --- /dev/null +++ b/model-00054-of-00092.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:25dcab199ede5099063a4a211374952e15e95f864988f93cea999e1ac1be1825 +size 3941946000 diff --git a/model-00055-of-00092.safetensors b/model-00055-of-00092.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e896c37c15b1cbd746a4690651bf8668e1b2d67b --- /dev/null +++ b/model-00055-of-00092.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:57c62fba715fb7373078f697eabda5c22a28a028f9a7b157d0eab44b6a2982dd +size 3941946000 diff --git a/model-00056-of-00092.safetensors b/model-00056-of-00092.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f64bbd248d522fde98462b30d94e8777cc40754a --- /dev/null +++ b/model-00056-of-00092.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0d8e2336a5b79acae36c8bc2fd8245b648e402c7c0a9fd27a9ad1cdcdc55e35 +size 3941946000 diff --git a/model-00057-of-00092.safetensors b/model-00057-of-00092.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e5651787cd4810c2656d60a30e11b9370d251815 --- /dev/null +++ b/model-00057-of-00092.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c928a35b63210c92caba603462aac155c988c2887814dfbaafb8507c4432bab +size 3941946000 diff --git a/model-00058-of-00092.safetensors b/model-00058-of-00092.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a0042af51f7443161d3c2273c15ab201cb1e19f0 --- /dev/null +++ b/model-00058-of-00092.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39abd3b08f1247e0c59ed096e41c328141831cd297e261c4f2f6d4d15605be04 +size 3941946000 diff --git a/model-00059-of-00092.safetensors b/model-00059-of-00092.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..bd068233148883fd67c4b923c8321662215bc2db --- /dev/null +++ b/model-00059-of-00092.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:ee449fec8018e00c728e353ea91f4f6749645adafb621e85a3da98f18aa48b39 +size 3941946000 diff --git a/model-00060-of-00092.safetensors b/model-00060-of-00092.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..fa52da9fc6284eb301efa35dd1077abbcfb1aab4 --- /dev/null +++ b/model-00060-of-00092.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6cca12f50b985b8d566372a98a895432e66e889cd4997f37165d3aa3ad7927b9 +size 3941946000 diff --git a/model-00061-of-00092.safetensors b/model-00061-of-00092.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b6221293eafebcd316b054fcb0b2266c92595ede --- /dev/null +++ b/model-00061-of-00092.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:178e31d637b5d67e18deacac90eac7c19e2ed0381ba18967665740f979797e19 +size 3941946000 diff --git a/model-00062-of-00092.safetensors b/model-00062-of-00092.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..cebca0fa0c05007dc868347fb0ffd749fbf8c13a --- /dev/null +++ b/model-00062-of-00092.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cfd0f735b8e608a48af211b8e17836ce7b81ce91c69dd20653c71882b129f902 +size 3941946000 diff --git a/model-00063-of-00092.safetensors b/model-00063-of-00092.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..23e4df9a33c13767a6ec418def44202035cba526 --- /dev/null +++ b/model-00063-of-00092.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f79b931f9901303c4eaa2f142631375731428e685298d731d9e96b450c9579d +size 3941946000 diff --git a/model-00064-of-00092.safetensors b/model-00064-of-00092.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..9b081e774cc85cfbc438145dae36a566d85fbe84 --- /dev/null +++ b/model-00064-of-00092.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:9e7154a05437423b6a1820c7cffb130ceb2a5a9b2b99ab0c868a38bb3bb8eb1f +size 3941946000 diff --git a/model-00065-of-00092.safetensors b/model-00065-of-00092.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a3f2d429b3f5066d674167c4732e0905462fffbf --- /dev/null +++ b/model-00065-of-00092.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b981b155390b43bd39b2a5e3e568c1991b8d85c5966700fd2e77609af2817bd +size 3941946000 diff --git a/model-00066-of-00092.safetensors b/model-00066-of-00092.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..1bffedee3763192b750cae595c75962ab1e589d1 --- /dev/null +++ b/model-00066-of-00092.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e5fa0a4798c9c173142b82589a5fc21208a54f81caa5464d52d4dc919839e35 +size 3941946000 diff --git a/model-00067-of-00092.safetensors b/model-00067-of-00092.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8b6aaaa00e0d815ed997173205f50e455461fca1 --- /dev/null +++ b/model-00067-of-00092.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7642e77c5b79fd69a1b3a702752cc49a9b9e6c0742615a7dffae32485bccf8dc +size 3941946000 diff --git a/model-00068-of-00092.safetensors b/model-00068-of-00092.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..06da087afff80bb4c47db304a95a6925e03da944 --- /dev/null +++ b/model-00068-of-00092.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2acab87829de540864f267c0c460ad2dd3bf4de8c6193336d803c69e68c0e118 +size 3941946000 diff --git a/model-00069-of-00092.safetensors b/model-00069-of-00092.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..03f442810bcb21897a9f39b11b02d70adee549d9 --- /dev/null +++ b/model-00069-of-00092.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:53ab4c3e7bda5f956fac92d641f4fa0f59ff9eb76b17f6f5784292aa91223459 +size 3941946000 diff --git a/model-00070-of-00092.safetensors b/model-00070-of-00092.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..565bc1e95f09276ef21c6d99b32d364aaf2677f4 --- /dev/null +++ b/model-00070-of-00092.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff7c3e8ac7fc32e94301f5c811f633d1cd7671c581e4afa9e3b71c3ad5900d41 +size 3941946000 diff --git a/model-00071-of-00092.safetensors b/model-00071-of-00092.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..bd260e09780ee7de5bd10e0b5bb6fe5eda517354 --- /dev/null +++ b/model-00071-of-00092.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:219f7d0d09cf60950f0afa6bd219801fe9b740d999ae4bcd6b29f8b067bbbe65 +size 3941946000 diff --git a/model-00072-of-00092.safetensors b/model-00072-of-00092.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..80494ca1116d7b0c82987013b5d0d4539042c408 --- /dev/null +++ b/model-00072-of-00092.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e6c90d3e3810dce5d726f3709b5c090972c2760a49179bbaf501e9350d5dfae +size 3941946000 diff --git a/model-00073-of-00092.safetensors b/model-00073-of-00092.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..679ab1ed65baa9019ed8e2b6b1c7fa89b91c0185 --- /dev/null +++ b/model-00073-of-00092.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:69d544b89fbc0c8f641dca9fc57fb69b40b471f9d0af4e8ceebc509b9bd846bf +size 3941946000 diff --git a/model-00074-of-00092.safetensors b/model-00074-of-00092.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..665812199c35801b6616ee07508f3ab3063fcbe0 --- /dev/null +++ b/model-00074-of-00092.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:085c3296e419064f7aaf27994ce768fb65e670aed0c4de8149203a82bf3b3f95 +size 3941946000 diff --git a/model-00075-of-00092.safetensors b/model-00075-of-00092.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..36388d8bbdd51c0fae330f4bdf19e8f4b2a399c3 --- /dev/null +++ b/model-00075-of-00092.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:532e038f6687377fdc85f8009b4b1b304cc45a9cff49af9dc81e031465a5fe8a +size 3941946000 diff --git a/model-00076-of-00092.safetensors b/model-00076-of-00092.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..04011111bcd77aa168a80c4b22a4403dc02eea28 --- /dev/null +++ b/model-00076-of-00092.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:595028c19b4c94029a7a64500de9d5127f698a5cd5f0347e0a071db272a35322 +size 3941946000 diff --git a/model-00077-of-00092.safetensors b/model-00077-of-00092.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..11a35cfbfa4ad6383a928c00a1051c98479cc59a --- /dev/null +++ b/model-00077-of-00092.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f4bafd0685064c6855c60bce9bffcf99fb0b29e80b6603492c6c3cac46cdffa1 +size 3941946000 diff --git a/model-00078-of-00092.safetensors b/model-00078-of-00092.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..37b739ceada56331b028250838ec1aafbcc91701 --- /dev/null +++ b/model-00078-of-00092.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be67adfc219969301f298e9fbea60513ec0470971e47fa7c3a6070ed3bdb0956 +size 3941946000 diff --git a/model-00079-of-00092.safetensors b/model-00079-of-00092.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..ac23cb22b66bb24938ded37fe0ca9019c946e17f --- /dev/null +++ b/model-00079-of-00092.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:9fb5c4b4465d340d7dacf948dfd8d65c634cb9ec8f754596083365e232babac3 +size 3941946000 diff --git a/model-00080-of-00092.safetensors b/model-00080-of-00092.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..edc4d51c0e7e2198e8f21943cefbfdd1a009c765 --- /dev/null +++ b/model-00080-of-00092.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6810cc361fe280843675844645d0211bca0546a8ef33464d91dd47940205317a +size 3941946000 diff --git a/model-00081-of-00092.safetensors b/model-00081-of-00092.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e17cb0fb3ee7a45c35152b0590c86bff180de455 --- /dev/null +++ b/model-00081-of-00092.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:593dce45d7e5a6feba3bbc00a928911b6242906b7c934d263d3d66218f5a6159 +size 3941946000 diff --git a/model-00082-of-00092.safetensors b/model-00082-of-00092.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..971106cc33b860833bdd0fdce22e8ef5641f20e2 --- /dev/null +++ b/model-00082-of-00092.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a29714ca5445705fd6ca4609f1775fb31cd3d338abccaf8fd768ccbe0049cbb +size 3941946000 diff --git a/model-00083-of-00092.safetensors b/model-00083-of-00092.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..4a503262f35e069e222f10e3e1e450c80e70beab --- /dev/null +++ b/model-00083-of-00092.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c62679b47cde1adb854a9de8506b1e62fd4dafc8c029780f8228234fb2dbe8f +size 3941946000 diff --git a/model-00084-of-00092.safetensors b/model-00084-of-00092.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..fe4c41b438edcf6300f146dc93722d53fe244ae1 --- /dev/null +++ b/model-00084-of-00092.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:2e73e8c4a224489ba6401ba3420a0dc12a8978acc4a5da3f968c6e8e6169eb0e +size 3941946000 diff --git a/model-00085-of-00092.safetensors b/model-00085-of-00092.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c57b2477936e573730f627dae25c87ea34b63b4c --- /dev/null +++ b/model-00085-of-00092.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a8585b73d4ab24e73dbbad803269cd8d8e0eef795ebd66d4f5b40a0c73a782b +size 3941946000 diff --git a/model-00086-of-00092.safetensors b/model-00086-of-00092.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..4cb5d5c50afd285b3808c4764a0380137e778445 --- /dev/null +++ b/model-00086-of-00092.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5111ae197b208badc1ea31c0eaafe8a49e649862015a023e712f500e3ced464a +size 3941946000 diff --git a/model-00087-of-00092.safetensors b/model-00087-of-00092.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..efb225cc0719489a22d98cb239cd8612314e8492 --- /dev/null +++ b/model-00087-of-00092.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f04c69b8f445d91720f7c389613b3927425fc38be5027af99467029f860cdeb +size 3941946000 diff --git a/model-00088-of-00092.safetensors b/model-00088-of-00092.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..9a50bb6fae4b25cbf86eafb0100a556e809b4eda --- /dev/null +++ b/model-00088-of-00092.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:922beebb36eafa20e410a37737eee7c6d16d8114d1dd09c4ebccc703d51e9537 +size 3941946000 diff --git a/model-00089-of-00092.safetensors b/model-00089-of-00092.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..4f68571c0463a0e0c57e94aa115dbb64a7355f09 --- /dev/null +++ b/model-00089-of-00092.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:dd76187e5c79aefc3c6fad87a48c7339f6e5960c62328be1a3934f606438e101 +size 3941946000 diff --git a/model-00090-of-00092.safetensors b/model-00090-of-00092.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..cbf33d1baa193a7f269827d36f96df0fda04c448 --- /dev/null +++ b/model-00090-of-00092.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f2c5c3b7d5798182b92b711177db1abd4805ab646a2450d792d8932cc3cc1330 +size 3941946000 diff --git a/model-00091-of-00092.safetensors b/model-00091-of-00092.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c63f425d7ec7a84aa32a85777922b0bda1f102b1 --- /dev/null +++ b/model-00091-of-00092.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:41496ad8b78d3ffa537482a7af105055a83a271e9a10b4364b663362094088be +size 3941946000 diff --git a/model-00092-of-00092.safetensors b/model-00092-of-00092.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..59818eb13ea7972581902f077eca5ddf72d486f1 --- /dev/null +++ b/model-00092-of-00092.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a3160dfca14b9b6f2d46f7d63228903ebaa890b169e4fe36e77366e35d73985 +size 5493849232 diff --git a/model.safetensors.index.json b/model.safetensors.index.json new file mode 100644 index 0000000000000000000000000000000000000000..19bba211162e856fdef26980cd437c52050ad693 --- /dev/null +++ b/model.safetensors.index.json @@ -0,0 +1,87560 @@ +{ + "weight_map": { + "model.embed_tokens.weight": "model-00001-of-00092.safetensors", + "model.layers.0.input_layernorm.weight": "model-00001-of-00092.safetensors", + "model.layers.0.mlp.down_proj.weight": "model-00001-of-00092.safetensors", + "model.layers.0.mlp.down_proj.weight_scale": "model-00001-of-00092.safetensors", + "model.layers.0.mlp.gate_proj.weight": "model-00001-of-00092.safetensors", + "model.layers.0.mlp.gate_proj.weight_scale": 
"model-00001-of-00092.safetensors", + "model.layers.0.mlp.up_proj.weight": "model-00001-of-00092.safetensors", + "model.layers.0.mlp.up_proj.weight_scale": "model-00001-of-00092.safetensors", + "model.layers.0.post_attention_layernorm.weight": "model-00001-of-00092.safetensors", + "model.layers.0.self_attn.k_norm.weight": "model-00001-of-00092.safetensors", + "model.layers.0.self_attn.k_proj.bias": "model-00001-of-00092.safetensors", + "model.layers.0.self_attn.k_proj.weight": "model-00001-of-00092.safetensors", + "model.layers.0.self_attn.k_proj.weight_scale": "model-00001-of-00092.safetensors", + "model.layers.0.self_attn.o_proj.weight": "model-00001-of-00092.safetensors", + "model.layers.0.self_attn.o_proj.weight_scale": "model-00001-of-00092.safetensors", + "model.layers.0.self_attn.q_norm.weight": "model-00001-of-00092.safetensors", + "model.layers.0.self_attn.q_proj.bias": "model-00001-of-00092.safetensors", + "model.layers.0.self_attn.q_proj.weight": "model-00001-of-00092.safetensors", + "model.layers.0.self_attn.q_proj.weight_scale": "model-00001-of-00092.safetensors", + "model.layers.0.self_attn.v_proj.bias": "model-00001-of-00092.safetensors", + "model.layers.0.self_attn.v_proj.weight": "model-00001-of-00092.safetensors", + "model.layers.0.self_attn.v_proj.weight_scale": "model-00001-of-00092.safetensors", + "model.layers.1.input_layernorm.weight": "model-00002-of-00092.safetensors", + "model.layers.1.mlp.down_proj.weight": "model-00002-of-00092.safetensors", + "model.layers.1.mlp.down_proj.weight_scale": "model-00002-of-00092.safetensors", + "model.layers.1.mlp.gate_proj.weight": "model-00002-of-00092.safetensors", + "model.layers.1.mlp.gate_proj.weight_scale": "model-00002-of-00092.safetensors", + "model.layers.1.mlp.up_proj.weight": "model-00002-of-00092.safetensors", + "model.layers.1.mlp.up_proj.weight_scale": "model-00002-of-00092.safetensors", + "model.layers.1.post_attention_layernorm.weight": "model-00002-of-00092.safetensors", + 
"model.layers.1.self_attn.k_norm.weight": "model-00002-of-00092.safetensors", + "model.layers.1.self_attn.k_proj.bias": "model-00002-of-00092.safetensors", + "model.layers.1.self_attn.k_proj.weight": "model-00002-of-00092.safetensors", + "model.layers.1.self_attn.k_proj.weight_scale": "model-00002-of-00092.safetensors", + "model.layers.1.self_attn.o_proj.weight": "model-00002-of-00092.safetensors", + "model.layers.1.self_attn.o_proj.weight_scale": "model-00002-of-00092.safetensors", + "model.layers.1.self_attn.q_norm.weight": "model-00002-of-00092.safetensors", + "model.layers.1.self_attn.q_proj.bias": "model-00002-of-00092.safetensors", + "model.layers.1.self_attn.q_proj.weight": "model-00002-of-00092.safetensors", + "model.layers.1.self_attn.q_proj.weight_scale": "model-00002-of-00092.safetensors", + "model.layers.1.self_attn.v_proj.bias": "model-00002-of-00092.safetensors", + "model.layers.1.self_attn.v_proj.weight": "model-00002-of-00092.safetensors", + "model.layers.1.self_attn.v_proj.weight_scale": "model-00002-of-00092.safetensors", + "model.layers.2.input_layernorm.weight": "model-00003-of-00092.safetensors", + "model.layers.2.mlp.down_proj.weight": "model-00003-of-00092.safetensors", + "model.layers.2.mlp.down_proj.weight_scale": "model-00003-of-00092.safetensors", + "model.layers.2.mlp.gate_proj.weight": "model-00003-of-00092.safetensors", + "model.layers.2.mlp.gate_proj.weight_scale": "model-00003-of-00092.safetensors", + "model.layers.2.mlp.up_proj.weight": "model-00003-of-00092.safetensors", + "model.layers.2.mlp.up_proj.weight_scale": "model-00003-of-00092.safetensors", + "model.layers.2.post_attention_layernorm.weight": "model-00003-of-00092.safetensors", + "model.layers.2.self_attn.k_norm.weight": "model-00003-of-00092.safetensors", + "model.layers.2.self_attn.k_proj.bias": "model-00003-of-00092.safetensors", + "model.layers.2.self_attn.k_proj.weight": "model-00003-of-00092.safetensors", + "model.layers.2.self_attn.k_proj.weight_scale": 
"model-00003-of-00092.safetensors", + "model.layers.2.self_attn.o_proj.weight": "model-00003-of-00092.safetensors", + "model.layers.2.self_attn.o_proj.weight_scale": "model-00003-of-00092.safetensors", + "model.layers.2.self_attn.q_norm.weight": "model-00003-of-00092.safetensors", + "model.layers.2.self_attn.q_proj.bias": "model-00003-of-00092.safetensors", + "model.layers.2.self_attn.q_proj.weight": "model-00003-of-00092.safetensors", + "model.layers.2.self_attn.q_proj.weight_scale": "model-00003-of-00092.safetensors", + "model.layers.2.self_attn.v_proj.bias": "model-00003-of-00092.safetensors", + "model.layers.2.self_attn.v_proj.weight": "model-00003-of-00092.safetensors", + "model.layers.2.self_attn.v_proj.weight_scale": "model-00003-of-00092.safetensors", + "model.layers.3.input_layernorm.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.0.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.0.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.0.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.0.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.0.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.0.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.1.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.1.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.1.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.1.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.1.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.1.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.10.down_proj.weight": 
"model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.10.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.10.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.10.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.10.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.10.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.100.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.100.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.100.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.100.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.100.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.100.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.101.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.101.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.101.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.101.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.101.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.101.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.102.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.102.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.102.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.102.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + 
"model.layers.3.mlp.experts.102.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.102.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.103.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.103.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.103.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.103.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.103.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.103.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.104.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.104.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.104.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.104.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.104.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.104.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.105.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.105.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.105.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.105.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.105.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.105.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.106.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.106.down_proj.weight_scale": 
"model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.106.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.106.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.106.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.106.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.107.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.107.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.107.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.107.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.107.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.107.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.108.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.108.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.108.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.108.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.108.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.108.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.109.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.109.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.109.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.109.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.109.up_proj.weight": "model-00004-of-00092.safetensors", + 
"model.layers.3.mlp.experts.109.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.11.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.11.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.11.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.11.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.11.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.11.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.110.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.110.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.110.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.110.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.110.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.110.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.111.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.111.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.111.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.111.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.111.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.111.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.112.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.112.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.112.gate_proj.weight": 
"model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.112.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.112.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.112.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.113.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.113.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.113.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.113.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.113.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.113.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.114.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.114.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.114.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.114.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.114.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.114.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.115.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.115.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.115.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.115.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.115.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.115.up_proj.weight_scale": "model-00004-of-00092.safetensors", + 
"model.layers.3.mlp.experts.116.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.116.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.116.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.116.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.116.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.116.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.117.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.117.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.117.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.117.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.117.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.117.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.118.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.118.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.118.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.118.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.118.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.118.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.119.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.119.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.119.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.119.gate_proj.weight_scale": 
"model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.119.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.119.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.12.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.12.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.12.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.12.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.12.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.12.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.120.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.120.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.120.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.120.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.120.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.120.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.121.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.121.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.121.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.121.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.121.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.121.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.122.down_proj.weight": "model-00004-of-00092.safetensors", + 
"model.layers.3.mlp.experts.122.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.122.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.122.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.122.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.122.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.123.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.123.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.123.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.123.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.123.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.123.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.124.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.124.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.124.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.124.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.124.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.124.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.125.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.125.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.125.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.125.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.125.up_proj.weight": 
"model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.125.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.126.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.126.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.126.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.126.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.126.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.126.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.127.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.127.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.127.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.127.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.127.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.127.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.128.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.128.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.128.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.128.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.128.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.128.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.129.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.129.down_proj.weight_scale": "model-00004-of-00092.safetensors", + 
"model.layers.3.mlp.experts.129.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.129.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.129.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.129.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.13.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.13.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.13.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.13.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.13.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.13.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.130.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.130.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.130.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.130.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.130.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.130.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.131.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.131.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.131.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.131.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.131.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.131.up_proj.weight_scale": "model-00004-of-00092.safetensors", 
+ "model.layers.3.mlp.experts.132.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.132.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.132.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.132.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.132.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.132.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.133.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.133.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.133.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.133.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.133.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.133.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.134.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.134.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.134.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.134.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.134.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.134.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.135.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.135.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.135.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.135.gate_proj.weight_scale": 
"model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.135.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.135.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.136.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.136.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.136.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.136.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.136.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.136.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.137.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.137.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.137.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.137.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.137.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.137.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.138.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.138.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.138.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.138.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.138.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.138.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.139.down_proj.weight": "model-00004-of-00092.safetensors", + 
"model.layers.3.mlp.experts.139.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.139.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.139.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.139.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.139.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.14.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.14.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.14.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.14.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.14.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.14.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.140.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.140.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.140.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.140.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.140.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.140.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.141.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.141.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.141.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.141.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.141.up_proj.weight": 
"model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.141.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.142.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.142.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.142.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.142.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.142.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.142.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.143.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.143.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.143.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.143.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.143.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.143.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.144.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.144.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.144.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.144.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.144.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.144.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.145.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.145.down_proj.weight_scale": "model-00004-of-00092.safetensors", + 
"model.layers.3.mlp.experts.145.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.145.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.145.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.145.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.146.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.146.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.146.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.146.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.146.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.146.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.147.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.147.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.147.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.147.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.147.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.147.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.148.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.148.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.148.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.148.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.148.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.148.up_proj.weight_scale": 
"model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.149.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.149.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.149.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.149.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.149.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.149.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.15.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.15.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.15.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.15.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.15.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.15.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.150.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.150.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.150.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.150.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.150.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.150.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.151.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.151.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.151.gate_proj.weight": "model-00004-of-00092.safetensors", + 
"model.layers.3.mlp.experts.151.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.151.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.151.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.152.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.152.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.152.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.152.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.152.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.152.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.153.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.153.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.153.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.153.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.153.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.153.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.154.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.154.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.154.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.154.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.154.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.154.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.155.down_proj.weight": 
"model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.155.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.155.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.155.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.155.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.155.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.156.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.156.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.156.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.156.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.156.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.156.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.157.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.157.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.157.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.157.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.157.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.157.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.158.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.158.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.158.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.158.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + 
"model.layers.3.mlp.experts.158.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.158.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.159.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.159.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.159.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.159.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.159.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.159.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.16.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.16.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.16.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.16.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.16.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.16.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.17.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.17.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.17.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.17.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.17.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.17.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.18.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.18.down_proj.weight_scale": "model-00004-of-00092.safetensors", + 
"model.layers.3.mlp.experts.18.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.18.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.18.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.18.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.19.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.19.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.19.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.19.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.19.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.19.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.2.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.2.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.2.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.2.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.2.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.2.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.20.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.20.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.20.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.20.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.20.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.20.up_proj.weight_scale": "model-00004-of-00092.safetensors", + 
"model.layers.3.mlp.experts.21.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.21.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.21.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.21.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.21.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.21.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.22.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.22.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.22.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.22.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.22.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.22.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.23.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.23.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.23.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.23.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.23.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.23.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.24.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.24.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.24.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.24.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + 
"model.layers.3.mlp.experts.24.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.24.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.25.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.25.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.25.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.25.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.25.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.25.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.26.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.26.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.26.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.26.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.26.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.26.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.27.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.27.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.27.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.27.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.27.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.27.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.28.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.28.down_proj.weight_scale": "model-00004-of-00092.safetensors", + 
"model.layers.3.mlp.experts.28.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.28.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.28.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.28.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.29.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.29.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.29.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.29.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.29.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.29.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.3.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.3.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.3.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.3.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.3.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.3.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.30.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.30.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.30.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.30.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.30.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.30.up_proj.weight_scale": "model-00004-of-00092.safetensors", + 
"model.layers.3.mlp.experts.31.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.31.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.31.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.31.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.31.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.31.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.32.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.32.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.32.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.32.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.32.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.32.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.33.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.33.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.33.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.33.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.33.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.33.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.34.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.34.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.34.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.34.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + 
"model.layers.3.mlp.experts.34.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.34.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.35.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.35.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.35.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.35.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.35.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.35.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.36.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.36.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.36.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.36.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.36.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.36.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.37.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.37.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.37.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.37.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.37.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.37.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.38.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.38.down_proj.weight_scale": "model-00004-of-00092.safetensors", + 
"model.layers.3.mlp.experts.38.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.38.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.38.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.38.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.39.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.39.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.39.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.39.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.39.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.39.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.4.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.4.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.4.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.4.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.4.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.4.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.40.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.40.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.40.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.40.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.40.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.40.up_proj.weight_scale": "model-00004-of-00092.safetensors", + 
"model.layers.3.mlp.experts.41.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.41.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.41.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.41.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.41.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.41.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.42.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.42.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.42.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.42.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.42.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.42.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.43.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.43.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.43.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.43.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.43.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.43.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.44.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.44.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.44.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.44.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + 
"model.layers.3.mlp.experts.44.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.44.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.45.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.45.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.45.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.45.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.45.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.45.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.46.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.46.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.46.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.46.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.46.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.46.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.47.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.47.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.47.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.47.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.47.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.47.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.48.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.48.down_proj.weight_scale": "model-00004-of-00092.safetensors", + 
"model.layers.3.mlp.experts.48.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.48.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.48.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.48.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.49.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.49.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.49.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.49.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.49.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.49.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.5.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.5.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.5.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.5.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.5.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.5.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.50.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.50.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.50.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.50.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.50.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.50.up_proj.weight_scale": "model-00004-of-00092.safetensors", + 
"model.layers.3.mlp.experts.51.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.51.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.51.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.51.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.51.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.51.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.52.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.52.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.52.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.52.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.52.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.52.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.53.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.53.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.53.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.53.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.53.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.53.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.54.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.54.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.54.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.54.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + 
"model.layers.3.mlp.experts.54.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.54.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.55.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.55.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.55.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.55.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.55.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.55.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.56.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.56.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.56.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.56.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.56.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.56.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.57.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.57.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.57.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.57.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.57.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.57.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.58.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.58.down_proj.weight_scale": "model-00004-of-00092.safetensors", + 
"model.layers.3.mlp.experts.58.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.58.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.58.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.58.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.59.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.59.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.59.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.59.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.59.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.59.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.6.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.6.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.6.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.6.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.6.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.6.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.60.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.60.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.60.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.60.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.60.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.60.up_proj.weight_scale": "model-00004-of-00092.safetensors", + 
"model.layers.3.mlp.experts.61.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.61.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.61.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.61.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.61.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.61.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.62.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.62.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.62.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.62.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.62.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.62.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.63.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.63.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.63.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.63.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.63.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.63.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.64.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.64.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.64.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.64.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + 
"model.layers.3.mlp.experts.64.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.64.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.65.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.65.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.65.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.65.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.65.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.65.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.66.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.66.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.66.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.66.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.66.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.66.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.67.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.67.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.67.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.67.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.67.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.67.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.68.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.68.down_proj.weight_scale": "model-00004-of-00092.safetensors", + 
"model.layers.3.mlp.experts.68.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.68.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.68.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.68.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.69.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.69.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.69.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.69.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.69.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.69.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.7.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.7.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.7.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.7.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.7.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.7.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.70.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.70.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.70.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.70.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.70.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.70.up_proj.weight_scale": "model-00004-of-00092.safetensors", + 
"model.layers.3.mlp.experts.71.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.71.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.71.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.71.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.71.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.71.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.72.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.72.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.72.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.72.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.72.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.72.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.73.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.73.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.73.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.73.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.73.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.73.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.74.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.74.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.74.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.74.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + 
"model.layers.3.mlp.experts.74.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.74.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.75.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.75.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.75.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.75.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.75.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.75.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.76.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.76.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.76.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.76.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.76.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.76.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.77.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.77.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.77.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.77.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.77.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.77.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.78.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.78.down_proj.weight_scale": "model-00004-of-00092.safetensors", + 
"model.layers.3.mlp.experts.78.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.78.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.78.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.78.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.79.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.79.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.79.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.79.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.79.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.79.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.8.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.8.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.8.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.8.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.8.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.8.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.80.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.80.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.80.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.80.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.80.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.80.up_proj.weight_scale": "model-00004-of-00092.safetensors", + 
"model.layers.3.mlp.experts.81.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.81.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.81.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.81.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.81.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.81.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.82.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.82.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.82.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.82.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.82.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.82.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.83.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.83.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.83.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.83.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.83.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.83.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.84.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.84.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.84.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.84.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + 
"model.layers.3.mlp.experts.84.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.84.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.85.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.85.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.85.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.85.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.85.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.85.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.86.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.86.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.86.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.86.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.86.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.86.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.87.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.87.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.87.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.87.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.87.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.87.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.88.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.88.down_proj.weight_scale": "model-00004-of-00092.safetensors", + 
"model.layers.3.mlp.experts.88.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.88.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.88.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.88.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.89.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.89.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.89.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.89.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.89.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.89.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.9.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.9.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.9.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.9.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.9.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.9.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.90.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.90.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.90.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.90.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.90.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.90.up_proj.weight_scale": "model-00004-of-00092.safetensors", + 
"model.layers.3.mlp.experts.91.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.91.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.91.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.91.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.91.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.91.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.92.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.92.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.92.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.92.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.92.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.92.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.93.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.93.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.93.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.93.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.93.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.93.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.94.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.94.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.94.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.94.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + 
"model.layers.3.mlp.experts.94.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.94.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.95.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.95.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.95.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.95.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.95.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.95.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.96.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.96.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.96.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.96.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.96.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.96.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.97.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.97.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.97.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.97.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.97.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.97.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.98.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.98.down_proj.weight_scale": "model-00004-of-00092.safetensors", + 
"model.layers.3.mlp.experts.98.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.98.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.98.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.98.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.99.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.99.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.99.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.99.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.99.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.experts.99.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.gate.e_score_correction_bias": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.gate.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.shared_experts.down_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.shared_experts.down_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.shared_experts.gate_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.shared_experts.gate_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.shared_experts.up_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.mlp.shared_experts.up_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.post_attention_layernorm.weight": "model-00004-of-00092.safetensors", + "model.layers.3.self_attn.k_norm.weight": "model-00004-of-00092.safetensors", + "model.layers.3.self_attn.k_proj.bias": "model-00004-of-00092.safetensors", + "model.layers.3.self_attn.k_proj.weight": "model-00004-of-00092.safetensors", + 
"model.layers.3.self_attn.k_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.self_attn.o_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.self_attn.o_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.self_attn.q_norm.weight": "model-00004-of-00092.safetensors", + "model.layers.3.self_attn.q_proj.bias": "model-00004-of-00092.safetensors", + "model.layers.3.self_attn.q_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.self_attn.q_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.3.self_attn.v_proj.bias": "model-00004-of-00092.safetensors", + "model.layers.3.self_attn.v_proj.weight": "model-00004-of-00092.safetensors", + "model.layers.3.self_attn.v_proj.weight_scale": "model-00004-of-00092.safetensors", + "model.layers.4.input_layernorm.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.0.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.0.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.0.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.0.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.0.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.0.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.1.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.1.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.1.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.1.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.1.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.1.up_proj.weight_scale": "model-00005-of-00092.safetensors", + 
"model.layers.4.mlp.experts.10.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.10.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.10.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.10.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.10.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.10.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.100.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.100.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.100.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.100.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.100.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.100.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.101.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.101.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.101.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.101.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.101.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.101.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.102.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.102.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.102.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.102.gate_proj.weight_scale": 
"model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.102.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.102.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.103.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.103.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.103.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.103.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.103.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.103.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.104.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.104.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.104.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.104.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.104.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.104.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.105.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.105.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.105.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.105.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.105.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.105.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.106.down_proj.weight": "model-00005-of-00092.safetensors", + 
"model.layers.4.mlp.experts.106.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.106.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.106.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.106.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.106.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.107.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.107.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.107.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.107.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.107.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.107.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.108.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.108.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.108.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.108.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.108.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.108.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.109.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.109.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.109.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.109.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.109.up_proj.weight": 
"model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.109.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.11.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.11.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.11.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.11.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.11.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.11.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.110.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.110.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.110.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.110.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.110.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.110.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.111.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.111.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.111.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.111.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.111.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.111.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.112.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.112.down_proj.weight_scale": "model-00005-of-00092.safetensors", + 
"model.layers.4.mlp.experts.112.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.112.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.112.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.112.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.113.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.113.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.113.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.113.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.113.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.113.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.114.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.114.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.114.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.114.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.114.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.114.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.115.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.115.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.115.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.115.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.115.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.115.up_proj.weight_scale": 
"model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.116.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.116.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.116.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.116.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.116.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.116.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.117.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.117.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.117.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.117.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.117.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.117.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.118.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.118.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.118.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.118.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.118.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.118.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.119.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.119.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.119.gate_proj.weight": "model-00005-of-00092.safetensors", + 
"model.layers.4.mlp.experts.119.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.119.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.119.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.12.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.12.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.12.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.12.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.12.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.12.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.120.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.120.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.120.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.120.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.120.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.120.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.121.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.121.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.121.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.121.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.121.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.121.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.122.down_proj.weight": "model-00005-of-00092.safetensors", 
+ "model.layers.4.mlp.experts.122.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.122.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.122.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.122.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.122.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.123.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.123.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.123.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.123.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.123.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.123.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.124.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.124.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.124.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.124.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.124.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.124.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.125.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.125.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.125.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.125.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.125.up_proj.weight": 
"model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.125.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.126.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.126.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.126.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.126.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.126.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.126.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.127.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.127.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.127.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.127.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.127.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.127.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.128.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.128.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.128.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.128.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.128.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.128.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.129.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.129.down_proj.weight_scale": "model-00005-of-00092.safetensors", + 
"model.layers.4.mlp.experts.129.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.129.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.129.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.129.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.13.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.13.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.13.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.13.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.13.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.13.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.130.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.130.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.130.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.130.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.130.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.130.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.131.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.131.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.131.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.131.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.131.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.131.up_proj.weight_scale": "model-00005-of-00092.safetensors", 
+ "model.layers.4.mlp.experts.132.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.132.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.132.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.132.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.132.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.132.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.133.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.133.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.133.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.133.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.133.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.133.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.134.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.134.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.134.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.134.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.134.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.134.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.135.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.135.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.135.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.135.gate_proj.weight_scale": 
"model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.135.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.135.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.136.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.136.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.136.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.136.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.136.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.136.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.137.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.137.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.137.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.137.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.137.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.137.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.138.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.138.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.138.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.138.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.138.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.138.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.139.down_proj.weight": "model-00005-of-00092.safetensors", + 
"model.layers.4.mlp.experts.139.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.139.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.139.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.139.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.139.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.14.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.14.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.14.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.14.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.14.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.14.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.140.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.140.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.140.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.140.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.140.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.140.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.141.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.141.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.141.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.141.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.141.up_proj.weight": 
"model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.141.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.142.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.142.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.142.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.142.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.142.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.142.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.143.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.143.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.143.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.143.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.143.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.143.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.144.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.144.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.144.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.144.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.144.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.144.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.145.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.145.down_proj.weight_scale": "model-00005-of-00092.safetensors", + 
"model.layers.4.mlp.experts.145.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.145.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.145.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.145.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.146.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.146.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.146.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.146.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.146.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.146.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.147.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.147.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.147.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.147.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.147.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.147.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.148.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.148.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.148.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.148.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.148.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.148.up_proj.weight_scale": 
"model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.149.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.149.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.149.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.149.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.149.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.149.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.15.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.15.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.15.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.15.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.15.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.15.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.150.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.150.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.150.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.150.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.150.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.150.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.151.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.151.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.151.gate_proj.weight": "model-00005-of-00092.safetensors", + 
"model.layers.4.mlp.experts.151.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.151.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.151.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.152.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.152.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.152.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.152.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.152.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.152.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.153.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.153.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.153.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.153.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.153.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.153.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.154.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.154.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.154.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.154.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.154.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.154.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.155.down_proj.weight": 
"model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.155.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.155.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.155.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.155.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.155.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.156.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.156.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.156.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.156.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.156.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.156.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.157.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.157.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.157.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.157.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.157.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.157.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.158.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.158.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.158.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.158.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + 
"model.layers.4.mlp.experts.158.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.158.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.159.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.159.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.159.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.159.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.159.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.159.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.16.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.16.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.16.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.16.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.16.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.16.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.17.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.17.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.17.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.17.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.17.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.17.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.18.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.18.down_proj.weight_scale": "model-00005-of-00092.safetensors", + 
"model.layers.4.mlp.experts.18.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.18.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.18.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.18.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.19.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.19.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.19.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.19.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.19.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.19.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.2.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.2.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.2.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.2.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.2.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.2.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.20.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.20.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.20.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.20.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.20.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.20.up_proj.weight_scale": "model-00005-of-00092.safetensors", + 
"model.layers.4.mlp.experts.21.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.21.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.21.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.21.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.21.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.21.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.22.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.22.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.22.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.22.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.22.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.22.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.23.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.23.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.23.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.23.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.23.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.23.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.24.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.24.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.24.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.24.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + 
"model.layers.4.mlp.experts.24.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.24.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.25.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.25.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.25.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.25.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.25.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.25.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.26.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.26.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.26.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.26.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.26.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.26.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.27.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.27.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.27.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.27.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.27.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.27.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.28.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.28.down_proj.weight_scale": "model-00005-of-00092.safetensors", + 
"model.layers.4.mlp.experts.28.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.28.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.28.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.28.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.29.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.29.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.29.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.29.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.29.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.29.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.3.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.3.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.3.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.3.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.3.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.3.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.30.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.30.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.30.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.30.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.30.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.30.up_proj.weight_scale": "model-00005-of-00092.safetensors", + 
"model.layers.4.mlp.experts.31.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.31.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.31.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.31.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.31.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.31.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.32.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.32.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.32.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.32.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.32.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.32.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.33.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.33.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.33.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.33.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.33.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.33.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.34.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.34.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.34.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.34.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + 
"model.layers.4.mlp.experts.34.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.34.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.35.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.35.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.35.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.35.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.35.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.35.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.36.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.36.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.36.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.36.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.36.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.36.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.37.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.37.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.37.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.37.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.37.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.37.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.38.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.38.down_proj.weight_scale": "model-00005-of-00092.safetensors", + 
"model.layers.4.mlp.experts.38.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.38.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.38.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.38.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.39.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.39.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.39.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.39.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.39.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.39.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.4.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.4.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.4.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.4.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.4.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.4.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.40.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.40.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.40.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.40.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.40.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.40.up_proj.weight_scale": "model-00005-of-00092.safetensors", + 
"model.layers.4.mlp.experts.41.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.41.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.41.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.41.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.41.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.41.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.42.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.42.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.42.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.42.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.42.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.42.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.43.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.43.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.43.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.43.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.43.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.43.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.44.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.44.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.44.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.44.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + 
"model.layers.4.mlp.experts.44.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.44.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.45.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.45.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.45.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.45.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.45.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.45.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.46.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.46.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.46.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.46.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.46.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.46.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.47.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.47.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.47.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.47.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.47.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.47.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.48.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.48.down_proj.weight_scale": "model-00005-of-00092.safetensors", + 
"model.layers.4.mlp.experts.48.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.48.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.48.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.48.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.49.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.49.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.49.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.49.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.49.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.49.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.5.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.5.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.5.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.5.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.5.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.5.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.50.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.50.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.50.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.50.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.50.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.50.up_proj.weight_scale": "model-00005-of-00092.safetensors", + 
"model.layers.4.mlp.experts.51.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.51.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.51.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.51.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.51.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.51.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.52.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.52.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.52.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.52.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.52.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.52.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.53.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.53.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.53.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.53.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.53.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.53.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.54.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.54.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.54.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.54.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + 
"model.layers.4.mlp.experts.54.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.54.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.55.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.55.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.55.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.55.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.55.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.55.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.56.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.56.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.56.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.56.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.56.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.56.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.57.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.57.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.57.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.57.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.57.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.57.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.58.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.58.down_proj.weight_scale": "model-00005-of-00092.safetensors", + 
"model.layers.4.mlp.experts.58.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.58.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.58.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.58.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.59.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.59.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.59.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.59.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.59.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.59.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.6.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.6.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.6.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.6.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.6.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.6.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.60.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.60.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.60.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.60.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.60.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.60.up_proj.weight_scale": "model-00005-of-00092.safetensors", + 
"model.layers.4.mlp.experts.61.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.61.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.61.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.61.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.61.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.61.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.62.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.62.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.62.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.62.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.62.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.62.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.63.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.63.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.63.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.63.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.63.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.63.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.64.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.64.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.64.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.64.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + 
"model.layers.4.mlp.experts.64.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.64.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.65.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.65.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.65.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.65.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.65.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.65.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.66.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.66.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.66.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.66.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.66.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.66.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.67.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.67.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.67.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.67.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.67.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.67.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.68.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.68.down_proj.weight_scale": "model-00005-of-00092.safetensors", + 
"model.layers.4.mlp.experts.68.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.68.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.68.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.68.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.69.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.69.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.69.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.69.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.69.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.69.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.7.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.7.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.7.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.7.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.7.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.7.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.70.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.70.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.70.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.70.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.70.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.70.up_proj.weight_scale": "model-00005-of-00092.safetensors", + 
"model.layers.4.mlp.experts.71.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.71.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.71.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.71.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.71.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.71.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.72.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.72.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.72.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.72.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.72.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.72.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.73.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.73.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.73.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.73.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.73.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.73.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.74.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.74.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.74.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.74.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + 
"model.layers.4.mlp.experts.74.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.74.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.75.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.75.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.75.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.75.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.75.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.75.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.76.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.76.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.76.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.76.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.76.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.76.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.77.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.77.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.77.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.77.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.77.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.77.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.78.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.78.down_proj.weight_scale": "model-00005-of-00092.safetensors", + 
"model.layers.4.mlp.experts.78.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.78.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.78.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.78.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.79.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.79.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.79.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.79.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.79.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.79.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.8.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.8.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.8.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.8.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.8.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.8.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.80.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.80.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.80.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.80.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.80.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.80.up_proj.weight_scale": "model-00005-of-00092.safetensors", + 
"model.layers.4.mlp.experts.81.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.81.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.81.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.81.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.81.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.81.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.82.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.82.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.82.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.82.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.82.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.82.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.83.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.83.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.83.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.83.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.83.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.83.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.84.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.84.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.84.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.84.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + 
"model.layers.4.mlp.experts.84.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.84.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.85.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.85.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.85.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.85.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.85.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.85.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.86.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.86.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.86.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.86.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.86.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.86.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.87.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.87.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.87.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.87.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.87.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.87.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.88.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.88.down_proj.weight_scale": "model-00005-of-00092.safetensors", + 
"model.layers.4.mlp.experts.88.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.88.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.88.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.88.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.89.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.89.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.89.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.89.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.89.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.89.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.9.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.9.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.9.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.9.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.9.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.9.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.90.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.90.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.90.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.90.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.90.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.90.up_proj.weight_scale": "model-00005-of-00092.safetensors", + 
"model.layers.4.mlp.experts.91.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.91.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.91.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.91.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.91.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.91.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.92.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.92.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.92.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.92.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.92.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.92.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.93.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.93.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.93.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.93.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.93.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.93.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.94.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.94.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.94.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.94.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + 
"model.layers.4.mlp.experts.94.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.94.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.95.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.95.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.95.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.95.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.95.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.95.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.96.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.96.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.96.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.96.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.96.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.96.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.97.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.97.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.97.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.97.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.97.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.97.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.98.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.98.down_proj.weight_scale": "model-00005-of-00092.safetensors", + 
"model.layers.4.mlp.experts.98.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.98.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.98.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.98.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.99.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.99.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.99.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.99.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.99.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.experts.99.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.gate.e_score_correction_bias": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.gate.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.shared_experts.down_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.shared_experts.down_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.shared_experts.gate_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.shared_experts.gate_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.shared_experts.up_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.mlp.shared_experts.up_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.post_attention_layernorm.weight": "model-00005-of-00092.safetensors", + "model.layers.4.self_attn.k_norm.weight": "model-00005-of-00092.safetensors", + "model.layers.4.self_attn.k_proj.bias": "model-00005-of-00092.safetensors", + "model.layers.4.self_attn.k_proj.weight": "model-00005-of-00092.safetensors", + 
"model.layers.4.self_attn.k_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.self_attn.o_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.self_attn.o_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.self_attn.q_norm.weight": "model-00005-of-00092.safetensors", + "model.layers.4.self_attn.q_proj.bias": "model-00005-of-00092.safetensors", + "model.layers.4.self_attn.q_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.self_attn.q_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.4.self_attn.v_proj.bias": "model-00005-of-00092.safetensors", + "model.layers.4.self_attn.v_proj.weight": "model-00005-of-00092.safetensors", + "model.layers.4.self_attn.v_proj.weight_scale": "model-00005-of-00092.safetensors", + "model.layers.5.input_layernorm.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.0.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.0.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.0.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.0.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.0.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.0.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.1.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.1.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.1.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.1.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.1.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.1.up_proj.weight_scale": "model-00006-of-00092.safetensors", + 
"model.layers.5.mlp.experts.10.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.10.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.10.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.10.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.10.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.10.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.100.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.100.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.100.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.100.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.100.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.100.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.101.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.101.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.101.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.101.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.101.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.101.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.102.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.102.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.102.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.102.gate_proj.weight_scale": 
"model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.102.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.102.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.103.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.103.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.103.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.103.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.103.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.103.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.104.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.104.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.104.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.104.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.104.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.104.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.105.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.105.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.105.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.105.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.105.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.105.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.106.down_proj.weight": "model-00006-of-00092.safetensors", + 
"model.layers.5.mlp.experts.106.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.106.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.106.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.106.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.106.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.107.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.107.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.107.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.107.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.107.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.107.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.108.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.108.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.108.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.108.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.108.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.108.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.109.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.109.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.109.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.109.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.109.up_proj.weight": 
"model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.109.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.11.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.11.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.11.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.11.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.11.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.11.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.110.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.110.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.110.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.110.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.110.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.110.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.111.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.111.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.111.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.111.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.111.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.111.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.112.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.112.down_proj.weight_scale": "model-00006-of-00092.safetensors", + 
"model.layers.5.mlp.experts.112.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.112.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.112.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.112.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.113.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.113.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.113.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.113.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.113.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.113.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.114.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.114.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.114.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.114.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.114.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.114.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.115.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.115.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.115.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.115.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.115.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.115.up_proj.weight_scale": 
"model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.116.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.116.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.116.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.116.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.116.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.116.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.117.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.117.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.117.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.117.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.117.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.117.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.118.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.118.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.118.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.118.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.118.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.118.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.119.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.119.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.119.gate_proj.weight": "model-00006-of-00092.safetensors", + 
"model.layers.5.mlp.experts.119.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.119.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.119.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.12.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.12.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.12.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.12.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.12.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.12.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.120.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.120.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.120.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.120.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.120.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.120.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.121.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.121.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.121.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.121.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.121.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.121.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.122.down_proj.weight": "model-00006-of-00092.safetensors", 
+ "model.layers.5.mlp.experts.122.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.122.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.122.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.122.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.122.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.123.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.123.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.123.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.123.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.123.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.123.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.124.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.124.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.124.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.124.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.124.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.124.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.125.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.125.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.125.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.125.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.125.up_proj.weight": 
"model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.125.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.126.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.126.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.126.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.126.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.126.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.126.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.127.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.127.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.127.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.127.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.127.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.127.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.128.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.128.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.128.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.128.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.128.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.128.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.129.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.129.down_proj.weight_scale": "model-00006-of-00092.safetensors", + 
"model.layers.5.mlp.experts.129.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.129.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.129.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.129.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.13.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.13.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.13.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.13.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.13.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.13.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.130.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.130.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.130.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.130.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.130.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.130.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.131.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.131.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.131.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.131.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.131.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.131.up_proj.weight_scale": "model-00006-of-00092.safetensors", 
+ "model.layers.5.mlp.experts.132.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.132.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.132.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.132.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.132.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.132.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.133.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.133.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.133.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.133.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.133.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.133.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.134.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.134.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.134.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.134.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.134.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.134.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.135.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.135.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.135.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.135.gate_proj.weight_scale": 
"model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.135.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.135.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.136.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.136.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.136.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.136.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.136.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.136.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.137.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.137.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.137.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.137.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.137.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.137.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.138.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.138.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.138.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.138.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.138.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.138.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.139.down_proj.weight": "model-00006-of-00092.safetensors", + 
"model.layers.5.mlp.experts.139.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.139.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.139.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.139.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.139.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.14.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.14.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.14.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.14.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.14.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.14.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.140.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.140.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.140.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.140.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.140.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.140.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.141.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.141.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.141.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.141.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.141.up_proj.weight": 
"model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.141.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.142.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.142.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.142.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.142.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.142.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.142.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.143.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.143.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.143.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.143.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.143.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.143.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.144.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.144.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.144.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.144.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.144.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.144.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.145.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.145.down_proj.weight_scale": "model-00006-of-00092.safetensors", + 
"model.layers.5.mlp.experts.145.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.145.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.145.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.145.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.146.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.146.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.146.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.146.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.146.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.146.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.147.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.147.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.147.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.147.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.147.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.147.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.148.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.148.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.148.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.148.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.148.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.148.up_proj.weight_scale": 
"model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.149.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.149.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.149.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.149.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.149.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.149.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.15.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.15.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.15.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.15.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.15.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.15.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.150.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.150.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.150.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.150.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.150.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.150.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.151.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.151.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.151.gate_proj.weight": "model-00006-of-00092.safetensors", + 
"model.layers.5.mlp.experts.151.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.151.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.151.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.152.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.152.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.152.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.152.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.152.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.152.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.153.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.153.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.153.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.153.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.153.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.153.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.154.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.154.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.154.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.154.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.154.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.154.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.155.down_proj.weight": 
"model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.155.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.155.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.155.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.155.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.155.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.156.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.156.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.156.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.156.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.156.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.156.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.157.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.157.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.157.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.157.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.157.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.157.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.158.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.158.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.158.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.158.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + 
"model.layers.5.mlp.experts.158.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.158.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.159.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.159.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.159.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.159.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.159.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.159.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.16.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.16.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.16.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.16.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.16.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.16.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.17.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.17.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.17.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.17.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.17.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.17.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.18.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.18.down_proj.weight_scale": "model-00006-of-00092.safetensors", + 
"model.layers.5.mlp.experts.18.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.18.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.18.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.18.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.19.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.19.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.19.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.19.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.19.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.19.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.2.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.2.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.2.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.2.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.2.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.2.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.20.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.20.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.20.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.20.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.20.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.20.up_proj.weight_scale": "model-00006-of-00092.safetensors", + 
"model.layers.5.mlp.experts.21.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.21.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.21.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.21.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.21.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.21.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.22.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.22.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.22.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.22.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.22.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.22.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.23.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.23.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.23.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.23.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.23.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.23.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.24.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.24.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.24.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.24.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + 
"model.layers.5.mlp.experts.24.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.24.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.25.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.25.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.25.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.25.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.25.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.25.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.26.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.26.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.26.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.26.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.26.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.26.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.27.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.27.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.27.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.27.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.27.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.27.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.28.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.28.down_proj.weight_scale": "model-00006-of-00092.safetensors", + 
"model.layers.5.mlp.experts.28.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.28.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.28.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.28.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.29.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.29.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.29.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.29.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.29.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.29.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.3.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.3.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.3.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.3.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.3.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.3.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.30.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.30.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.30.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.30.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.30.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.30.up_proj.weight_scale": "model-00006-of-00092.safetensors", + 
"model.layers.5.mlp.experts.31.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.31.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.31.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.31.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.31.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.31.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.32.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.32.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.32.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.32.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.32.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.32.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.33.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.33.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.33.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.33.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.33.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.33.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.34.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.34.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.34.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.34.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + 
"model.layers.5.mlp.experts.34.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.34.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.35.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.35.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.35.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.35.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.35.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.35.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.36.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.36.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.36.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.36.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.36.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.36.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.37.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.37.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.37.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.37.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.37.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.37.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.38.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.38.down_proj.weight_scale": "model-00006-of-00092.safetensors", + 
"model.layers.5.mlp.experts.38.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.38.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.38.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.38.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.39.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.39.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.39.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.39.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.39.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.39.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.4.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.4.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.4.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.4.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.4.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.4.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.40.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.40.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.40.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.40.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.40.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.40.up_proj.weight_scale": "model-00006-of-00092.safetensors", + 
"model.layers.5.mlp.experts.41.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.41.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.41.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.41.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.41.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.41.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.42.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.42.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.42.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.42.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.42.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.42.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.43.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.43.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.43.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.43.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.43.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.43.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.44.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.44.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.44.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.44.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + 
"model.layers.5.mlp.experts.44.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.44.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.45.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.45.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.45.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.45.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.45.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.45.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.46.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.46.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.46.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.46.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.46.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.46.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.47.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.47.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.47.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.47.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.47.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.47.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.48.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.48.down_proj.weight_scale": "model-00006-of-00092.safetensors", + 
"model.layers.5.mlp.experts.48.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.48.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.48.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.48.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.49.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.49.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.49.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.49.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.49.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.49.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.5.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.5.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.5.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.5.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.5.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.5.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.50.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.50.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.50.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.50.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.50.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.50.up_proj.weight_scale": "model-00006-of-00092.safetensors", + 
"model.layers.5.mlp.experts.51.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.51.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.51.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.51.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.51.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.51.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.52.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.52.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.52.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.52.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.52.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.52.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.53.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.53.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.53.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.53.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.53.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.53.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.54.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.54.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.54.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.54.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + 
"model.layers.5.mlp.experts.54.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.54.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.55.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.55.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.55.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.55.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.55.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.55.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.56.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.56.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.56.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.56.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.56.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.56.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.57.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.57.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.57.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.57.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.57.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.57.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.58.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.58.down_proj.weight_scale": "model-00006-of-00092.safetensors", + 
"model.layers.5.mlp.experts.58.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.58.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.58.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.58.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.59.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.59.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.59.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.59.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.59.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.59.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.6.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.6.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.6.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.6.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.6.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.6.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.60.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.60.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.60.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.60.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.60.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.60.up_proj.weight_scale": "model-00006-of-00092.safetensors", + 
"model.layers.5.mlp.experts.61.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.61.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.61.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.61.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.61.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.61.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.62.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.62.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.62.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.62.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.62.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.62.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.63.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.63.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.63.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.63.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.63.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.63.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.64.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.64.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.64.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.64.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + 
"model.layers.5.mlp.experts.64.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.64.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.65.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.65.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.65.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.65.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.65.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.65.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.66.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.66.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.66.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.66.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.66.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.66.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.67.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.67.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.67.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.67.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.67.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.67.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.68.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.68.down_proj.weight_scale": "model-00006-of-00092.safetensors", + 
"model.layers.5.mlp.experts.68.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.68.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.68.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.68.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.69.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.69.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.69.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.69.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.69.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.69.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.7.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.7.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.7.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.7.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.7.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.7.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.70.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.70.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.70.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.70.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.70.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.70.up_proj.weight_scale": "model-00006-of-00092.safetensors", + 
"model.layers.5.mlp.experts.71.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.71.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.71.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.71.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.71.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.71.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.72.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.72.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.72.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.72.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.72.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.72.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.73.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.73.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.73.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.73.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.73.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.73.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.74.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.74.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.74.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.74.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + 
"model.layers.5.mlp.experts.74.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.74.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.75.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.75.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.75.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.75.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.75.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.75.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.76.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.76.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.76.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.76.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.76.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.76.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.77.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.77.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.77.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.77.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.77.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.77.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.78.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.78.down_proj.weight_scale": "model-00006-of-00092.safetensors", + 
"model.layers.5.mlp.experts.78.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.78.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.78.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.78.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.79.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.79.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.79.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.79.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.79.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.79.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.8.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.8.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.8.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.8.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.8.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.8.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.80.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.80.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.80.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.80.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.80.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.80.up_proj.weight_scale": "model-00006-of-00092.safetensors", + 
"model.layers.5.mlp.experts.81.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.81.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.81.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.81.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.81.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.81.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.82.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.82.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.82.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.82.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.82.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.82.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.83.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.83.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.83.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.83.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.83.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.83.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.84.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.84.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.84.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.84.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + 
"model.layers.5.mlp.experts.84.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.84.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.85.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.85.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.85.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.85.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.85.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.85.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.86.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.86.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.86.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.86.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.86.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.86.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.87.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.87.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.87.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.87.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.87.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.87.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.88.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.88.down_proj.weight_scale": "model-00006-of-00092.safetensors", + 
"model.layers.5.mlp.experts.88.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.88.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.88.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.88.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.89.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.89.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.89.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.89.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.89.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.89.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.9.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.9.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.9.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.9.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.9.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.9.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.90.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.90.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.90.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.90.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.90.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.90.up_proj.weight_scale": "model-00006-of-00092.safetensors", + 
"model.layers.5.mlp.experts.91.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.91.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.91.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.91.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.91.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.91.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.92.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.92.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.92.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.92.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.92.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.92.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.93.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.93.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.93.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.93.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.93.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.93.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.94.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.94.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.94.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.94.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + 
"model.layers.5.mlp.experts.94.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.94.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.95.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.95.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.95.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.95.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.95.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.95.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.96.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.96.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.96.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.96.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.96.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.96.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.97.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.97.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.97.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.97.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.97.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.97.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.98.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.98.down_proj.weight_scale": "model-00006-of-00092.safetensors", + 
"model.layers.5.mlp.experts.98.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.98.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.98.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.98.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.99.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.99.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.99.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.99.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.99.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.experts.99.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.gate.e_score_correction_bias": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.gate.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.shared_experts.down_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.shared_experts.down_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.shared_experts.gate_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.shared_experts.gate_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.shared_experts.up_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.mlp.shared_experts.up_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.post_attention_layernorm.weight": "model-00006-of-00092.safetensors", + "model.layers.5.self_attn.k_norm.weight": "model-00006-of-00092.safetensors", + "model.layers.5.self_attn.k_proj.bias": "model-00006-of-00092.safetensors", + "model.layers.5.self_attn.k_proj.weight": "model-00006-of-00092.safetensors", + 
"model.layers.5.self_attn.k_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.self_attn.o_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.self_attn.o_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.self_attn.q_norm.weight": "model-00006-of-00092.safetensors", + "model.layers.5.self_attn.q_proj.bias": "model-00006-of-00092.safetensors", + "model.layers.5.self_attn.q_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.self_attn.q_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.5.self_attn.v_proj.bias": "model-00006-of-00092.safetensors", + "model.layers.5.self_attn.v_proj.weight": "model-00006-of-00092.safetensors", + "model.layers.5.self_attn.v_proj.weight_scale": "model-00006-of-00092.safetensors", + "model.layers.6.input_layernorm.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.0.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.0.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.0.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.0.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.0.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.0.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.1.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.1.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.1.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.1.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.1.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.1.up_proj.weight_scale": "model-00007-of-00092.safetensors", + 
"model.layers.6.mlp.experts.10.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.10.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.10.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.10.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.10.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.10.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.100.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.100.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.100.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.100.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.100.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.100.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.101.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.101.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.101.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.101.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.101.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.101.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.102.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.102.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.102.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.102.gate_proj.weight_scale": 
"model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.102.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.102.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.103.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.103.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.103.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.103.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.103.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.103.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.104.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.104.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.104.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.104.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.104.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.104.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.105.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.105.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.105.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.105.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.105.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.105.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.106.down_proj.weight": "model-00007-of-00092.safetensors", + 
"model.layers.6.mlp.experts.106.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.106.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.106.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.106.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.106.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.107.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.107.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.107.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.107.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.107.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.107.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.108.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.108.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.108.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.108.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.108.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.108.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.109.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.109.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.109.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.109.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.109.up_proj.weight": 
"model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.109.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.11.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.11.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.11.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.11.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.11.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.11.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.110.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.110.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.110.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.110.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.110.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.110.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.111.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.111.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.111.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.111.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.111.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.111.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.112.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.112.down_proj.weight_scale": "model-00007-of-00092.safetensors", + 
"model.layers.6.mlp.experts.112.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.112.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.112.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.112.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.113.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.113.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.113.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.113.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.113.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.113.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.114.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.114.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.114.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.114.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.114.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.114.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.115.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.115.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.115.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.115.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.115.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.115.up_proj.weight_scale": 
"model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.116.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.116.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.116.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.116.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.116.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.116.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.117.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.117.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.117.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.117.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.117.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.117.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.118.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.118.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.118.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.118.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.118.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.118.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.119.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.119.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.119.gate_proj.weight": "model-00007-of-00092.safetensors", + 
"model.layers.6.mlp.experts.119.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.119.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.119.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.12.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.12.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.12.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.12.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.12.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.12.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.120.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.120.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.120.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.120.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.120.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.120.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.121.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.121.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.121.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.121.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.121.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.121.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.122.down_proj.weight": "model-00007-of-00092.safetensors", 
+ "model.layers.6.mlp.experts.122.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.122.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.122.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.122.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.122.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.123.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.123.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.123.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.123.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.123.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.123.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.124.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.124.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.124.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.124.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.124.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.124.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.125.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.125.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.125.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.125.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.125.up_proj.weight": 
"model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.125.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.126.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.126.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.126.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.126.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.126.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.126.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.127.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.127.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.127.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.127.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.127.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.127.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.128.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.128.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.128.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.128.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.128.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.128.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.129.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.129.down_proj.weight_scale": "model-00007-of-00092.safetensors", + 
"model.layers.6.mlp.experts.129.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.129.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.129.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.129.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.13.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.13.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.13.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.13.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.13.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.13.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.130.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.130.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.130.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.130.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.130.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.130.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.131.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.131.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.131.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.131.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.131.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.131.up_proj.weight_scale": "model-00007-of-00092.safetensors", 
+ "model.layers.6.mlp.experts.132.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.132.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.132.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.132.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.132.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.132.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.133.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.133.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.133.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.133.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.133.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.133.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.134.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.134.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.134.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.134.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.134.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.134.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.135.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.135.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.135.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.135.gate_proj.weight_scale": 
"model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.135.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.135.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.136.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.136.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.136.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.136.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.136.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.136.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.137.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.137.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.137.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.137.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.137.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.137.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.138.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.138.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.138.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.138.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.138.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.138.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.139.down_proj.weight": "model-00007-of-00092.safetensors", + 
"model.layers.6.mlp.experts.139.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.139.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.139.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.139.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.139.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.14.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.14.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.14.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.14.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.14.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.14.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.140.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.140.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.140.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.140.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.140.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.140.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.141.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.141.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.141.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.141.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.141.up_proj.weight": 
"model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.141.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.142.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.142.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.142.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.142.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.142.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.142.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.143.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.143.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.143.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.143.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.143.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.143.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.144.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.144.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.144.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.144.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.144.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.144.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.145.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.145.down_proj.weight_scale": "model-00007-of-00092.safetensors", + 
"model.layers.6.mlp.experts.145.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.145.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.145.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.145.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.146.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.146.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.146.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.146.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.146.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.146.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.147.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.147.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.147.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.147.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.147.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.147.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.148.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.148.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.148.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.148.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.148.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.148.up_proj.weight_scale": 
"model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.149.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.149.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.149.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.149.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.149.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.149.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.15.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.15.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.15.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.15.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.15.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.15.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.150.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.150.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.150.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.150.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.150.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.150.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.151.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.151.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.151.gate_proj.weight": "model-00007-of-00092.safetensors", + 
"model.layers.6.mlp.experts.151.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.151.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.151.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.152.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.152.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.152.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.152.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.152.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.152.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.153.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.153.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.153.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.153.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.153.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.153.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.154.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.154.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.154.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.154.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.154.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.154.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.155.down_proj.weight": 
"model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.155.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.155.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.155.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.155.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.155.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.156.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.156.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.156.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.156.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.156.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.156.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.157.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.157.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.157.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.157.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.157.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.157.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.158.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.158.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.158.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.158.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + 
"model.layers.6.mlp.experts.158.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.158.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.159.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.159.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.159.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.159.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.159.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.159.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.16.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.16.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.16.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.16.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.16.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.16.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.17.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.17.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.17.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.17.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.17.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.17.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.18.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.18.down_proj.weight_scale": "model-00007-of-00092.safetensors", + 
"model.layers.6.mlp.experts.18.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.18.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.18.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.18.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.19.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.19.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.19.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.19.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.19.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.19.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.2.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.2.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.2.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.2.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.2.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.2.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.20.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.20.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.20.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.20.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.20.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.20.up_proj.weight_scale": "model-00007-of-00092.safetensors", + 
"model.layers.6.mlp.experts.21.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.21.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.21.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.21.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.21.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.21.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.22.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.22.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.22.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.22.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.22.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.22.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.23.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.23.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.23.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.23.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.23.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.23.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.24.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.24.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.24.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.24.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + 
"model.layers.6.mlp.experts.24.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.24.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.25.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.25.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.25.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.25.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.25.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.25.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.26.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.26.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.26.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.26.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.26.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.26.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.27.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.27.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.27.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.27.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.27.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.27.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.28.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.28.down_proj.weight_scale": "model-00007-of-00092.safetensors", + 
"model.layers.6.mlp.experts.28.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.28.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.28.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.28.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.29.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.29.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.29.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.29.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.29.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.29.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.3.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.3.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.3.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.3.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.3.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.3.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.30.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.30.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.30.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.30.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.30.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.30.up_proj.weight_scale": "model-00007-of-00092.safetensors", + 
"model.layers.6.mlp.experts.31.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.31.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.31.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.31.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.31.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.31.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.32.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.32.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.32.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.32.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.32.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.32.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.33.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.33.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.33.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.33.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.33.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.33.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.34.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.34.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.34.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.34.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + 
"model.layers.6.mlp.experts.34.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.34.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.35.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.35.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.35.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.35.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.35.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.35.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.36.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.36.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.36.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.36.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.36.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.36.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.37.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.37.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.37.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.37.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.37.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.37.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.38.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.38.down_proj.weight_scale": "model-00007-of-00092.safetensors", + 
"model.layers.6.mlp.experts.38.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.38.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.38.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.38.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.39.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.39.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.39.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.39.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.39.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.39.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.4.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.4.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.4.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.4.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.4.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.4.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.40.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.40.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.40.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.40.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.40.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.40.up_proj.weight_scale": "model-00007-of-00092.safetensors", + 
"model.layers.6.mlp.experts.41.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.41.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.41.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.41.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.41.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.41.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.42.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.42.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.42.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.42.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.42.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.42.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.43.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.43.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.43.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.43.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.43.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.43.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.44.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.44.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.44.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.44.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + 
"model.layers.6.mlp.experts.44.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.44.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.45.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.45.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.45.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.45.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.45.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.45.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.46.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.46.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.46.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.46.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.46.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.46.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.47.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.47.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.47.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.47.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.47.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.47.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.48.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.48.down_proj.weight_scale": "model-00007-of-00092.safetensors", + 
"model.layers.6.mlp.experts.48.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.48.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.48.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.48.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.49.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.49.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.49.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.49.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.49.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.49.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.5.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.5.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.5.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.5.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.5.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.5.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.50.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.50.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.50.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.50.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.50.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.50.up_proj.weight_scale": "model-00007-of-00092.safetensors", + 
"model.layers.6.mlp.experts.51.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.51.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.51.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.51.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.51.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.51.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.52.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.52.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.52.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.52.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.52.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.52.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.53.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.53.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.53.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.53.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.53.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.53.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.54.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.54.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.54.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.54.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + 
"model.layers.6.mlp.experts.54.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.54.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.55.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.55.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.55.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.55.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.55.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.55.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.56.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.56.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.56.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.56.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.56.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.56.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.57.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.57.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.57.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.57.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.57.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.57.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.58.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.58.down_proj.weight_scale": "model-00007-of-00092.safetensors", + 
"model.layers.6.mlp.experts.58.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.58.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.58.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.58.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.59.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.59.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.59.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.59.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.59.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.59.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.6.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.6.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.6.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.6.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.6.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.6.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.60.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.60.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.60.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.60.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.60.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.60.up_proj.weight_scale": "model-00007-of-00092.safetensors", + 
"model.layers.6.mlp.experts.61.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.61.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.61.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.61.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.61.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.61.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.62.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.62.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.62.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.62.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.62.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.62.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.63.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.63.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.63.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.63.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.63.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.63.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.64.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.64.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.64.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.64.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + 
"model.layers.6.mlp.experts.64.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.64.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.65.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.65.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.65.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.65.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.65.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.65.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.66.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.66.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.66.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.66.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.66.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.66.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.67.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.67.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.67.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.67.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.67.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.67.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.68.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.68.down_proj.weight_scale": "model-00007-of-00092.safetensors", + 
"model.layers.6.mlp.experts.68.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.68.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.68.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.68.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.69.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.69.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.69.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.69.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.69.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.69.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.7.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.7.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.7.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.7.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.7.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.7.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.70.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.70.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.70.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.70.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.70.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.70.up_proj.weight_scale": "model-00007-of-00092.safetensors", + 
"model.layers.6.mlp.experts.71.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.71.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.71.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.71.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.71.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.71.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.72.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.72.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.72.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.72.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.72.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.72.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.73.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.73.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.73.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.73.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.73.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.73.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.74.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.74.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.74.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.74.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + 
"model.layers.6.mlp.experts.74.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.74.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.75.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.75.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.75.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.75.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.75.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.75.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.76.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.76.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.76.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.76.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.76.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.76.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.77.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.77.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.77.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.77.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.77.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.77.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.78.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.78.down_proj.weight_scale": "model-00007-of-00092.safetensors", + 
"model.layers.6.mlp.experts.78.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.78.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.78.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.78.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.79.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.79.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.79.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.79.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.79.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.79.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.8.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.8.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.8.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.8.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.8.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.8.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.80.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.80.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.80.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.80.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.80.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.80.up_proj.weight_scale": "model-00007-of-00092.safetensors", + 
"model.layers.6.mlp.experts.81.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.81.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.81.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.81.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.81.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.81.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.82.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.82.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.82.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.82.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.82.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.82.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.83.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.83.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.83.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.83.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.83.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.83.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.84.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.84.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.84.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.84.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + 
"model.layers.6.mlp.experts.84.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.84.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.85.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.85.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.85.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.85.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.85.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.85.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.86.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.86.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.86.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.86.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.86.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.86.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.87.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.87.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.87.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.87.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.87.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.87.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.88.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.88.down_proj.weight_scale": "model-00007-of-00092.safetensors", + 
"model.layers.6.mlp.experts.88.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.88.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.88.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.88.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.89.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.89.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.89.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.89.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.89.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.89.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.9.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.9.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.9.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.9.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.9.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.9.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.90.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.90.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.90.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.90.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.90.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.90.up_proj.weight_scale": "model-00007-of-00092.safetensors", + 
"model.layers.6.mlp.experts.91.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.91.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.91.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.91.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.91.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.91.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.92.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.92.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.92.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.92.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.92.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.92.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.93.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.93.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.93.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.93.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.93.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.93.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.94.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.94.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.94.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.94.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + 
"model.layers.6.mlp.experts.94.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.94.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.95.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.95.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.95.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.95.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.95.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.95.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.96.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.96.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.96.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.96.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.96.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.96.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.97.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.97.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.97.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.97.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.97.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.97.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.98.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.98.down_proj.weight_scale": "model-00007-of-00092.safetensors", + 
"model.layers.6.mlp.experts.98.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.98.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.98.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.98.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.99.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.99.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.99.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.99.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.99.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.experts.99.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.gate.e_score_correction_bias": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.gate.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.shared_experts.down_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.shared_experts.down_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.shared_experts.gate_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.shared_experts.gate_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.shared_experts.up_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.mlp.shared_experts.up_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.post_attention_layernorm.weight": "model-00007-of-00092.safetensors", + "model.layers.6.self_attn.k_norm.weight": "model-00007-of-00092.safetensors", + "model.layers.6.self_attn.k_proj.bias": "model-00007-of-00092.safetensors", + "model.layers.6.self_attn.k_proj.weight": "model-00007-of-00092.safetensors", + 
"model.layers.6.self_attn.k_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.self_attn.o_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.self_attn.o_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.self_attn.q_norm.weight": "model-00007-of-00092.safetensors", + "model.layers.6.self_attn.q_proj.bias": "model-00007-of-00092.safetensors", + "model.layers.6.self_attn.q_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.self_attn.q_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.6.self_attn.v_proj.bias": "model-00007-of-00092.safetensors", + "model.layers.6.self_attn.v_proj.weight": "model-00007-of-00092.safetensors", + "model.layers.6.self_attn.v_proj.weight_scale": "model-00007-of-00092.safetensors", + "model.layers.7.input_layernorm.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.0.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.0.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.0.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.0.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.0.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.0.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.1.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.1.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.1.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.1.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.1.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.1.up_proj.weight_scale": "model-00008-of-00092.safetensors", + 
"model.layers.7.mlp.experts.10.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.10.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.10.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.10.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.10.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.10.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.100.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.100.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.100.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.100.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.100.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.100.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.101.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.101.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.101.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.101.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.101.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.101.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.102.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.102.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.102.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.102.gate_proj.weight_scale": 
"model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.102.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.102.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.103.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.103.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.103.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.103.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.103.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.103.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.104.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.104.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.104.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.104.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.104.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.104.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.105.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.105.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.105.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.105.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.105.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.105.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.106.down_proj.weight": "model-00008-of-00092.safetensors", + 
"model.layers.7.mlp.experts.106.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.106.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.106.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.106.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.106.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.107.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.107.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.107.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.107.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.107.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.107.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.108.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.108.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.108.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.108.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.108.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.108.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.109.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.109.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.109.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.109.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.109.up_proj.weight": 
"model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.109.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.11.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.11.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.11.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.11.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.11.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.11.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.110.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.110.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.110.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.110.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.110.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.110.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.111.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.111.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.111.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.111.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.111.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.111.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.112.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.112.down_proj.weight_scale": "model-00008-of-00092.safetensors", + 
"model.layers.7.mlp.experts.112.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.112.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.112.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.112.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.113.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.113.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.113.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.113.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.113.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.113.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.114.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.114.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.114.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.114.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.114.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.114.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.115.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.115.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.115.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.115.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.115.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.115.up_proj.weight_scale": 
"model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.116.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.116.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.116.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.116.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.116.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.116.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.117.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.117.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.117.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.117.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.117.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.117.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.118.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.118.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.118.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.118.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.118.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.118.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.119.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.119.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.119.gate_proj.weight": "model-00008-of-00092.safetensors", + 
"model.layers.7.mlp.experts.119.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.119.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.119.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.12.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.12.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.12.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.12.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.12.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.12.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.120.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.120.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.120.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.120.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.120.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.120.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.121.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.121.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.121.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.121.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.121.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.121.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.122.down_proj.weight": "model-00008-of-00092.safetensors", 
+ "model.layers.7.mlp.experts.122.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.122.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.122.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.122.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.122.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.123.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.123.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.123.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.123.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.123.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.123.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.124.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.124.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.124.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.124.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.124.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.124.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.125.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.125.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.125.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.125.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.125.up_proj.weight": 
"model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.125.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.126.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.126.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.126.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.126.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.126.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.126.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.127.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.127.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.127.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.127.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.127.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.127.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.128.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.128.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.128.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.128.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.128.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.128.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.129.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.129.down_proj.weight_scale": "model-00008-of-00092.safetensors", + 
"model.layers.7.mlp.experts.129.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.129.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.129.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.129.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.13.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.13.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.13.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.13.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.13.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.13.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.130.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.130.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.130.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.130.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.130.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.130.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.131.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.131.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.131.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.131.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.131.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.131.up_proj.weight_scale": "model-00008-of-00092.safetensors", 
+ "model.layers.7.mlp.experts.132.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.132.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.132.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.132.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.132.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.132.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.133.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.133.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.133.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.133.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.133.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.133.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.134.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.134.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.134.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.134.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.134.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.134.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.135.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.135.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.135.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.135.gate_proj.weight_scale": 
"model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.135.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.135.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.136.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.136.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.136.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.136.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.136.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.136.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.137.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.137.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.137.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.137.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.137.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.137.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.138.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.138.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.138.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.138.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.138.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.138.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.139.down_proj.weight": "model-00008-of-00092.safetensors", + 
"model.layers.7.mlp.experts.139.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.139.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.139.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.139.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.139.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.14.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.14.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.14.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.14.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.14.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.14.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.140.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.140.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.140.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.140.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.140.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.140.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.141.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.141.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.141.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.141.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.141.up_proj.weight": 
"model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.141.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.142.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.142.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.142.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.142.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.142.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.142.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.143.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.143.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.143.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.143.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.143.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.143.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.144.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.144.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.144.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.144.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.144.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.144.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.145.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.145.down_proj.weight_scale": "model-00008-of-00092.safetensors", + 
"model.layers.7.mlp.experts.145.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.145.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.145.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.145.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.146.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.146.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.146.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.146.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.146.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.146.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.147.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.147.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.147.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.147.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.147.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.147.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.148.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.148.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.148.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.148.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.148.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.148.up_proj.weight_scale": 
"model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.149.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.149.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.149.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.149.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.149.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.149.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.15.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.15.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.15.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.15.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.15.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.15.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.150.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.150.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.150.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.150.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.150.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.150.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.151.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.151.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.151.gate_proj.weight": "model-00008-of-00092.safetensors", + 
"model.layers.7.mlp.experts.151.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.151.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.151.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.152.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.152.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.152.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.152.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.152.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.152.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.153.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.153.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.153.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.153.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.153.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.153.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.154.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.154.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.154.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.154.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.154.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.154.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.155.down_proj.weight": 
"model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.155.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.155.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.155.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.155.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.155.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.156.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.156.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.156.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.156.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.156.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.156.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.157.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.157.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.157.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.157.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.157.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.157.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.158.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.158.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.158.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.158.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + 
"model.layers.7.mlp.experts.158.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.158.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.159.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.159.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.159.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.159.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.159.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.159.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.16.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.16.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.16.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.16.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.16.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.16.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.17.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.17.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.17.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.17.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.17.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.17.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.18.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.18.down_proj.weight_scale": "model-00008-of-00092.safetensors", + 
"model.layers.7.mlp.experts.18.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.18.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.18.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.18.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.19.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.19.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.19.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.19.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.19.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.19.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.2.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.2.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.2.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.2.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.2.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.2.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.20.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.20.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.20.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.20.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.20.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.20.up_proj.weight_scale": "model-00008-of-00092.safetensors", + 
"model.layers.7.mlp.experts.21.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.21.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.21.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.21.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.21.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.21.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.22.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.22.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.22.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.22.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.22.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.22.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.23.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.23.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.23.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.23.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.23.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.23.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.24.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.24.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.24.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.24.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + 
"model.layers.7.mlp.experts.24.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.24.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.25.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.25.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.25.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.25.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.25.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.25.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.26.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.26.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.26.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.26.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.26.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.26.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.27.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.27.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.27.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.27.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.27.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.27.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.28.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.28.down_proj.weight_scale": "model-00008-of-00092.safetensors", + 
"model.layers.7.mlp.experts.28.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.28.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.28.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.28.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.29.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.29.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.29.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.29.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.29.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.29.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.3.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.3.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.3.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.3.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.3.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.3.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.30.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.30.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.30.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.30.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.30.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.30.up_proj.weight_scale": "model-00008-of-00092.safetensors", + 
"model.layers.7.mlp.experts.31.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.31.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.31.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.31.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.31.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.31.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.32.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.32.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.32.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.32.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.32.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.32.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.33.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.33.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.33.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.33.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.33.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.33.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.34.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.34.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.34.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.34.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + 
"model.layers.7.mlp.experts.34.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.34.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.35.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.35.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.35.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.35.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.35.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.35.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.36.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.36.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.36.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.36.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.36.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.36.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.37.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.37.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.37.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.37.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.37.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.37.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.38.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.38.down_proj.weight_scale": "model-00008-of-00092.safetensors", + 
"model.layers.7.mlp.experts.38.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.38.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.38.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.38.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.39.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.39.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.39.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.39.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.39.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.39.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.4.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.4.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.4.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.4.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.4.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.4.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.40.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.40.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.40.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.40.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.40.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.40.up_proj.weight_scale": "model-00008-of-00092.safetensors", + 
"model.layers.7.mlp.experts.41.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.41.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.41.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.41.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.41.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.41.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.42.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.42.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.42.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.42.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.42.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.42.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.43.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.43.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.43.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.43.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.43.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.43.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.44.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.44.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.44.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.44.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + 
"model.layers.7.mlp.experts.44.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.44.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.45.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.45.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.45.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.45.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.45.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.45.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.46.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.46.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.46.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.46.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.46.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.46.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.47.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.47.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.47.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.47.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.47.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.47.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.48.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.48.down_proj.weight_scale": "model-00008-of-00092.safetensors", + 
"model.layers.7.mlp.experts.48.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.48.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.48.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.48.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.49.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.49.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.49.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.49.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.49.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.49.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.5.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.5.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.5.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.5.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.5.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.5.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.50.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.50.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.50.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.50.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.50.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.50.up_proj.weight_scale": "model-00008-of-00092.safetensors", + 
"model.layers.7.mlp.experts.51.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.51.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.51.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.51.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.51.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.51.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.52.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.52.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.52.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.52.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.52.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.52.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.53.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.53.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.53.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.53.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.53.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.53.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.54.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.54.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.54.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.54.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + 
"model.layers.7.mlp.experts.54.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.54.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.55.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.55.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.55.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.55.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.55.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.55.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.56.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.56.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.56.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.56.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.56.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.56.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.57.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.57.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.57.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.57.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.57.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.57.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.58.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.58.down_proj.weight_scale": "model-00008-of-00092.safetensors", + 
"model.layers.7.mlp.experts.58.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.58.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.58.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.58.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.59.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.59.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.59.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.59.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.59.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.59.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.6.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.6.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.6.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.6.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.6.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.6.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.60.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.60.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.60.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.60.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.60.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.60.up_proj.weight_scale": "model-00008-of-00092.safetensors", + 
"model.layers.7.mlp.experts.61.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.61.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.61.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.61.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.61.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.61.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.62.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.62.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.62.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.62.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.62.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.62.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.63.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.63.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.63.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.63.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.63.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.63.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.64.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.64.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.64.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.64.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + 
"model.layers.7.mlp.experts.64.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.64.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.65.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.65.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.65.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.65.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.65.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.65.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.66.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.66.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.66.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.66.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.66.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.66.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.67.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.67.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.67.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.67.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.67.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.67.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.68.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.68.down_proj.weight_scale": "model-00008-of-00092.safetensors", + 
"model.layers.7.mlp.experts.68.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.68.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.68.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.68.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.69.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.69.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.69.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.69.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.69.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.69.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.7.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.7.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.7.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.7.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.7.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.7.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.70.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.70.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.70.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.70.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.70.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.70.up_proj.weight_scale": "model-00008-of-00092.safetensors", + 
"model.layers.7.mlp.experts.71.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.71.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.71.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.71.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.71.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.71.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.72.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.72.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.72.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.72.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.72.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.72.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.73.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.73.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.73.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.73.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.73.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.73.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.74.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.74.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.74.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.74.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + 
"model.layers.7.mlp.experts.74.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.74.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.75.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.75.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.75.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.75.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.75.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.75.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.76.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.76.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.76.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.76.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.76.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.76.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.77.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.77.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.77.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.77.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.77.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.77.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.78.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.78.down_proj.weight_scale": "model-00008-of-00092.safetensors", + 
"model.layers.7.mlp.experts.78.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.78.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.78.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.78.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.79.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.79.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.79.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.79.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.79.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.79.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.8.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.8.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.8.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.8.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.8.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.8.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.80.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.80.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.80.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.80.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.80.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.80.up_proj.weight_scale": "model-00008-of-00092.safetensors", + 
"model.layers.7.mlp.experts.81.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.81.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.81.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.81.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.81.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.81.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.82.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.82.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.82.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.82.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.82.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.82.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.83.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.83.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.83.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.83.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.83.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.83.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.84.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.84.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.84.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.84.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + 
"model.layers.7.mlp.experts.84.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.84.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.85.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.85.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.85.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.85.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.85.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.85.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.86.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.86.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.86.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.86.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.86.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.86.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.87.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.87.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.87.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.87.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.87.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.87.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.88.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.88.down_proj.weight_scale": "model-00008-of-00092.safetensors", + 
"model.layers.7.mlp.experts.88.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.88.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.88.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.88.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.89.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.89.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.89.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.89.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.89.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.89.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.9.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.9.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.9.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.9.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.9.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.9.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.90.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.90.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.90.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.90.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.90.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.90.up_proj.weight_scale": "model-00008-of-00092.safetensors", + 
"model.layers.7.mlp.experts.91.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.91.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.91.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.91.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.91.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.91.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.92.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.92.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.92.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.92.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.92.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.92.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.93.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.93.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.93.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.93.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.93.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.93.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.94.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.94.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.94.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.94.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + 
"model.layers.7.mlp.experts.94.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.94.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.95.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.95.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.95.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.95.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.95.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.95.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.96.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.96.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.96.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.96.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.96.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.96.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.97.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.97.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.97.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.97.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.97.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.97.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.98.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.98.down_proj.weight_scale": "model-00008-of-00092.safetensors", + 
"model.layers.7.mlp.experts.98.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.98.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.98.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.98.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.99.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.99.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.99.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.99.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.99.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.experts.99.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.gate.e_score_correction_bias": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.gate.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.shared_experts.down_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.shared_experts.down_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.shared_experts.gate_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.shared_experts.gate_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.shared_experts.up_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.mlp.shared_experts.up_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.post_attention_layernorm.weight": "model-00008-of-00092.safetensors", + "model.layers.7.self_attn.k_norm.weight": "model-00008-of-00092.safetensors", + "model.layers.7.self_attn.k_proj.bias": "model-00008-of-00092.safetensors", + "model.layers.7.self_attn.k_proj.weight": "model-00008-of-00092.safetensors", + 
"model.layers.7.self_attn.k_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.self_attn.o_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.self_attn.o_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.self_attn.q_norm.weight": "model-00008-of-00092.safetensors", + "model.layers.7.self_attn.q_proj.bias": "model-00008-of-00092.safetensors", + "model.layers.7.self_attn.q_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.self_attn.q_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.7.self_attn.v_proj.bias": "model-00008-of-00092.safetensors", + "model.layers.7.self_attn.v_proj.weight": "model-00008-of-00092.safetensors", + "model.layers.7.self_attn.v_proj.weight_scale": "model-00008-of-00092.safetensors", + "model.layers.8.input_layernorm.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.0.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.0.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.0.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.0.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.0.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.0.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.1.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.1.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.1.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.1.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.1.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.1.up_proj.weight_scale": "model-00009-of-00092.safetensors", + 
"model.layers.8.mlp.experts.10.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.10.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.10.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.10.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.10.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.10.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.100.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.100.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.100.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.100.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.100.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.100.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.101.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.101.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.101.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.101.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.101.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.101.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.102.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.102.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.102.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.102.gate_proj.weight_scale": 
"model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.102.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.102.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.103.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.103.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.103.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.103.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.103.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.103.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.104.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.104.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.104.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.104.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.104.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.104.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.105.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.105.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.105.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.105.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.105.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.105.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.106.down_proj.weight": "model-00009-of-00092.safetensors", + 
"model.layers.8.mlp.experts.106.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.106.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.106.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.106.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.106.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.107.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.107.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.107.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.107.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.107.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.107.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.108.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.108.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.108.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.108.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.108.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.108.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.109.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.109.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.109.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.109.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.109.up_proj.weight": 
"model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.109.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.11.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.11.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.11.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.11.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.11.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.11.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.110.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.110.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.110.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.110.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.110.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.110.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.111.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.111.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.111.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.111.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.111.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.111.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.112.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.112.down_proj.weight_scale": "model-00009-of-00092.safetensors", + 
"model.layers.8.mlp.experts.112.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.112.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.112.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.112.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.113.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.113.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.113.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.113.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.113.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.113.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.114.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.114.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.114.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.114.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.114.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.114.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.115.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.115.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.115.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.115.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.115.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.115.up_proj.weight_scale": 
"model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.116.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.116.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.116.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.116.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.116.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.116.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.117.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.117.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.117.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.117.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.117.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.117.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.118.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.118.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.118.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.118.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.118.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.118.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.119.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.119.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.119.gate_proj.weight": "model-00009-of-00092.safetensors", + 
"model.layers.8.mlp.experts.119.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.119.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.119.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.12.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.12.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.12.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.12.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.12.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.12.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.120.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.120.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.120.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.120.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.120.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.120.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.121.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.121.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.121.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.121.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.121.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.121.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.122.down_proj.weight": "model-00009-of-00092.safetensors", 
+ "model.layers.8.mlp.experts.122.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.122.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.122.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.122.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.122.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.123.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.123.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.123.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.123.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.123.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.123.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.124.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.124.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.124.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.124.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.124.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.124.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.125.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.125.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.125.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.125.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.125.up_proj.weight": 
"model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.125.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.126.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.126.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.126.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.126.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.126.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.126.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.127.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.127.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.127.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.127.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.127.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.127.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.128.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.128.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.128.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.128.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.128.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.128.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.129.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.129.down_proj.weight_scale": "model-00009-of-00092.safetensors", + 
"model.layers.8.mlp.experts.129.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.129.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.129.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.129.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.13.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.13.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.13.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.13.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.13.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.13.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.130.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.130.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.130.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.130.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.130.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.130.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.131.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.131.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.131.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.131.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.131.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.131.up_proj.weight_scale": "model-00009-of-00092.safetensors", 
+ "model.layers.8.mlp.experts.132.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.132.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.132.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.132.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.132.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.132.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.133.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.133.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.133.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.133.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.133.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.133.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.134.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.134.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.134.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.134.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.134.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.134.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.135.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.135.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.135.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.135.gate_proj.weight_scale": 
"model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.135.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.135.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.136.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.136.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.136.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.136.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.136.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.136.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.137.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.137.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.137.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.137.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.137.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.137.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.138.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.138.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.138.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.138.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.138.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.138.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.139.down_proj.weight": "model-00009-of-00092.safetensors", + 
"model.layers.8.mlp.experts.139.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.139.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.139.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.139.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.139.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.14.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.14.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.14.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.14.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.14.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.14.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.140.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.140.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.140.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.140.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.140.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.140.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.141.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.141.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.141.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.141.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.141.up_proj.weight": 
"model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.141.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.142.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.142.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.142.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.142.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.142.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.142.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.143.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.143.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.143.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.143.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.143.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.143.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.144.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.144.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.144.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.144.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.144.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.144.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.145.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.145.down_proj.weight_scale": "model-00009-of-00092.safetensors", + 
"model.layers.8.mlp.experts.145.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.145.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.145.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.145.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.146.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.146.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.146.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.146.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.146.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.146.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.147.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.147.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.147.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.147.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.147.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.147.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.148.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.148.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.148.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.148.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.148.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.148.up_proj.weight_scale": 
"model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.149.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.149.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.149.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.149.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.149.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.149.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.15.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.15.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.15.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.15.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.15.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.15.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.150.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.150.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.150.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.150.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.150.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.150.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.151.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.151.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.151.gate_proj.weight": "model-00009-of-00092.safetensors", + 
"model.layers.8.mlp.experts.151.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.151.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.151.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.152.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.152.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.152.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.152.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.152.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.152.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.153.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.153.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.153.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.153.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.153.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.153.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.154.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.154.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.154.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.154.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.154.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.154.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.155.down_proj.weight": 
"model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.155.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.155.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.155.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.155.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.155.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.156.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.156.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.156.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.156.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.156.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.156.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.157.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.157.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.157.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.157.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.157.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.157.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.158.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.158.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.158.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.158.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + 
"model.layers.8.mlp.experts.158.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.158.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.159.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.159.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.159.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.159.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.159.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.159.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.16.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.16.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.16.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.16.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.16.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.16.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.17.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.17.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.17.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.17.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.17.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.17.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.18.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.18.down_proj.weight_scale": "model-00009-of-00092.safetensors", + 
"model.layers.8.mlp.experts.18.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.18.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.18.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.18.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.19.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.19.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.19.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.19.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.19.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.19.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.2.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.2.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.2.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.2.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.2.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.2.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.20.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.20.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.20.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.20.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.20.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.20.up_proj.weight_scale": "model-00009-of-00092.safetensors", + 
"model.layers.8.mlp.experts.21.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.21.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.21.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.21.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.21.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.21.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.22.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.22.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.22.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.22.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.22.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.22.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.23.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.23.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.23.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.23.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.23.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.23.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.24.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.24.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.24.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.24.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + 
"model.layers.8.mlp.experts.24.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.24.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.25.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.25.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.25.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.25.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.25.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.25.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.26.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.26.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.26.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.26.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.26.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.26.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.27.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.27.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.27.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.27.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.27.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.27.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.28.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.28.down_proj.weight_scale": "model-00009-of-00092.safetensors", + 
"model.layers.8.mlp.experts.28.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.28.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.28.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.28.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.29.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.29.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.29.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.29.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.29.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.29.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.3.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.3.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.3.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.3.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.3.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.3.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.30.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.30.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.30.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.30.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.30.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.30.up_proj.weight_scale": "model-00009-of-00092.safetensors", + 
"model.layers.8.mlp.experts.31.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.31.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.31.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.31.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.31.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.31.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.32.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.32.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.32.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.32.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.32.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.32.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.33.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.33.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.33.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.33.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.33.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.33.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.34.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.34.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.34.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.34.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + 
"model.layers.8.mlp.experts.34.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.34.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.35.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.35.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.35.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.35.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.35.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.35.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.36.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.36.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.36.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.36.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.36.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.36.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.37.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.37.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.37.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.37.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.37.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.37.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.38.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.38.down_proj.weight_scale": "model-00009-of-00092.safetensors", + 
"model.layers.8.mlp.experts.38.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.38.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.38.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.38.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.39.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.39.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.39.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.39.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.39.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.39.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.4.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.4.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.4.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.4.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.4.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.4.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.40.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.40.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.40.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.40.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.40.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.40.up_proj.weight_scale": "model-00009-of-00092.safetensors", + 
"model.layers.8.mlp.experts.41.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.41.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.41.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.41.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.41.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.41.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.42.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.42.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.42.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.42.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.42.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.42.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.43.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.43.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.43.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.43.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.43.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.43.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.44.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.44.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.44.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.44.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + 
"model.layers.8.mlp.experts.44.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.44.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.45.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.45.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.45.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.45.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.45.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.45.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.46.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.46.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.46.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.46.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.46.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.46.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.47.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.47.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.47.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.47.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.47.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.47.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.48.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.48.down_proj.weight_scale": "model-00009-of-00092.safetensors", + 
"model.layers.8.mlp.experts.48.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.48.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.48.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.48.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.49.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.49.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.49.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.49.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.49.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.49.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.5.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.5.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.5.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.5.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.5.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.5.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.50.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.50.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.50.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.50.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.50.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.50.up_proj.weight_scale": "model-00009-of-00092.safetensors", + 
"model.layers.8.mlp.experts.51.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.51.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.51.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.51.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.51.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.51.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.52.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.52.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.52.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.52.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.52.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.52.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.53.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.53.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.53.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.53.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.53.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.53.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.54.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.54.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.54.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.54.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + 
"model.layers.8.mlp.experts.54.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.54.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.55.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.55.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.55.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.55.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.55.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.55.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.56.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.56.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.56.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.56.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.56.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.56.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.57.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.57.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.57.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.57.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.57.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.57.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.58.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.58.down_proj.weight_scale": "model-00009-of-00092.safetensors", + 
"model.layers.8.mlp.experts.58.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.58.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.58.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.58.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.59.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.59.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.59.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.59.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.59.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.59.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.6.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.6.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.6.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.6.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.6.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.6.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.60.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.60.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.60.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.60.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.60.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.60.up_proj.weight_scale": "model-00009-of-00092.safetensors", + 
"model.layers.8.mlp.experts.61.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.61.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.61.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.61.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.61.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.61.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.62.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.62.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.62.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.62.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.62.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.62.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.63.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.63.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.63.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.63.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.63.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.63.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.64.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.64.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.64.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.64.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + 
"model.layers.8.mlp.experts.64.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.64.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.65.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.65.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.65.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.65.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.65.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.65.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.66.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.66.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.66.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.66.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.66.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.66.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.67.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.67.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.67.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.67.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.67.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.67.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.68.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.68.down_proj.weight_scale": "model-00009-of-00092.safetensors", + 
"model.layers.8.mlp.experts.68.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.68.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.68.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.68.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.69.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.69.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.69.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.69.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.69.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.69.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.7.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.7.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.7.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.7.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.7.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.7.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.70.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.70.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.70.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.70.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.70.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.70.up_proj.weight_scale": "model-00009-of-00092.safetensors", + 
"model.layers.8.mlp.experts.71.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.71.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.71.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.71.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.71.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.71.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.72.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.72.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.72.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.72.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.72.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.72.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.73.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.73.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.73.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.73.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.73.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.73.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.74.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.74.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.74.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.74.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + 
"model.layers.8.mlp.experts.74.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.74.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.75.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.75.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.75.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.75.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.75.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.75.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.76.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.76.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.76.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.76.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.76.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.76.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.77.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.77.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.77.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.77.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.77.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.77.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.78.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.78.down_proj.weight_scale": "model-00009-of-00092.safetensors", + 
"model.layers.8.mlp.experts.78.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.78.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.78.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.78.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.79.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.79.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.79.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.79.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.79.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.79.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.8.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.8.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.8.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.8.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.8.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.8.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.80.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.80.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.80.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.80.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.80.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.80.up_proj.weight_scale": "model-00009-of-00092.safetensors", + 
"model.layers.8.mlp.experts.81.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.81.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.81.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.81.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.81.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.81.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.82.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.82.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.82.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.82.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.82.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.82.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.83.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.83.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.83.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.83.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.83.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.83.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.84.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.84.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.84.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.84.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + 
"model.layers.8.mlp.experts.84.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.84.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.85.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.85.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.85.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.85.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.85.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.85.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.86.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.86.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.86.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.86.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.86.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.86.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.87.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.87.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.87.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.87.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.87.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.87.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.88.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.88.down_proj.weight_scale": "model-00009-of-00092.safetensors", + 
"model.layers.8.mlp.experts.88.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.88.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.88.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.88.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.89.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.89.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.89.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.89.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.89.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.89.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.9.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.9.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.9.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.9.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.9.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.9.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.90.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.90.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.90.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.90.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.90.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.90.up_proj.weight_scale": "model-00009-of-00092.safetensors", + 
"model.layers.8.mlp.experts.91.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.91.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.91.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.91.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.91.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.91.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.92.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.92.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.92.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.92.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.92.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.92.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.93.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.93.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.93.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.93.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.93.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.93.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.94.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.94.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.94.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.94.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + 
"model.layers.8.mlp.experts.94.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.94.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.95.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.95.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.95.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.95.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.95.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.95.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.96.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.96.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.96.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.96.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.96.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.96.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.97.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.97.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.97.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.97.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.97.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.97.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.98.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.98.down_proj.weight_scale": "model-00009-of-00092.safetensors", + 
"model.layers.8.mlp.experts.98.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.98.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.98.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.98.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.99.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.99.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.99.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.99.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.99.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.experts.99.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.gate.e_score_correction_bias": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.gate.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.shared_experts.down_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.shared_experts.down_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.shared_experts.gate_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.shared_experts.gate_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.shared_experts.up_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.mlp.shared_experts.up_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.post_attention_layernorm.weight": "model-00009-of-00092.safetensors", + "model.layers.8.self_attn.k_norm.weight": "model-00009-of-00092.safetensors", + "model.layers.8.self_attn.k_proj.bias": "model-00009-of-00092.safetensors", + "model.layers.8.self_attn.k_proj.weight": "model-00009-of-00092.safetensors", + 
"model.layers.8.self_attn.k_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.self_attn.o_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.self_attn.o_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.self_attn.q_norm.weight": "model-00009-of-00092.safetensors", + "model.layers.8.self_attn.q_proj.bias": "model-00009-of-00092.safetensors", + "model.layers.8.self_attn.q_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.self_attn.q_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.8.self_attn.v_proj.bias": "model-00009-of-00092.safetensors", + "model.layers.8.self_attn.v_proj.weight": "model-00009-of-00092.safetensors", + "model.layers.8.self_attn.v_proj.weight_scale": "model-00009-of-00092.safetensors", + "model.layers.9.input_layernorm.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.0.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.0.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.0.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.0.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.0.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.0.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.1.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.1.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.1.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.1.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.1.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.1.up_proj.weight_scale": "model-00010-of-00092.safetensors", + 
"model.layers.9.mlp.experts.10.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.10.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.10.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.10.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.10.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.10.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.100.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.100.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.100.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.100.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.100.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.100.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.101.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.101.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.101.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.101.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.101.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.101.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.102.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.102.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.102.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.102.gate_proj.weight_scale": 
"model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.102.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.102.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.103.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.103.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.103.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.103.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.103.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.103.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.104.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.104.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.104.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.104.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.104.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.104.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.105.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.105.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.105.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.105.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.105.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.105.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.106.down_proj.weight": "model-00010-of-00092.safetensors", + 
"model.layers.9.mlp.experts.106.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.106.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.106.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.106.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.106.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.107.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.107.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.107.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.107.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.107.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.107.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.108.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.108.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.108.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.108.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.108.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.108.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.109.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.109.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.109.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.109.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.109.up_proj.weight": 
"model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.109.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.11.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.11.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.11.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.11.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.11.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.11.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.110.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.110.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.110.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.110.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.110.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.110.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.111.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.111.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.111.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.111.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.111.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.111.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.112.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.112.down_proj.weight_scale": "model-00010-of-00092.safetensors", + 
"model.layers.9.mlp.experts.112.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.112.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.112.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.112.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.113.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.113.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.113.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.113.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.113.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.113.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.114.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.114.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.114.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.114.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.114.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.114.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.115.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.115.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.115.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.115.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.115.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.115.up_proj.weight_scale": 
"model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.116.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.116.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.116.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.116.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.116.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.116.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.117.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.117.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.117.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.117.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.117.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.117.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.118.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.118.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.118.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.118.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.118.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.118.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.119.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.119.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.119.gate_proj.weight": "model-00010-of-00092.safetensors", + 
"model.layers.9.mlp.experts.119.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.119.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.119.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.12.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.12.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.12.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.12.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.12.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.12.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.120.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.120.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.120.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.120.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.120.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.120.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.121.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.121.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.121.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.121.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.121.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.121.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.122.down_proj.weight": "model-00010-of-00092.safetensors", 
+ "model.layers.9.mlp.experts.122.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.122.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.122.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.122.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.122.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.123.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.123.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.123.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.123.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.123.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.123.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.124.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.124.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.124.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.124.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.124.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.124.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.125.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.125.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.125.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.125.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.125.up_proj.weight": 
"model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.125.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.126.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.126.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.126.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.126.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.126.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.126.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.127.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.127.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.127.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.127.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.127.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.127.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.128.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.128.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.128.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.128.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.128.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.128.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.129.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.129.down_proj.weight_scale": "model-00010-of-00092.safetensors", + 
"model.layers.9.mlp.experts.129.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.129.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.129.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.129.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.13.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.13.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.13.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.13.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.13.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.13.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.130.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.130.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.130.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.130.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.130.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.130.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.131.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.131.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.131.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.131.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.131.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.131.up_proj.weight_scale": "model-00010-of-00092.safetensors", 
+ "model.layers.9.mlp.experts.132.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.132.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.132.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.132.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.132.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.132.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.133.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.133.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.133.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.133.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.133.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.133.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.134.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.134.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.134.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.134.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.134.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.134.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.135.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.135.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.135.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.135.gate_proj.weight_scale": 
"model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.135.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.135.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.136.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.136.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.136.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.136.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.136.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.136.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.137.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.137.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.137.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.137.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.137.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.137.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.138.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.138.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.138.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.138.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.138.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.138.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.139.down_proj.weight": "model-00010-of-00092.safetensors", + 
"model.layers.9.mlp.experts.139.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.139.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.139.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.139.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.139.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.14.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.14.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.14.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.14.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.14.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.14.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.140.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.140.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.140.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.140.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.140.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.140.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.141.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.141.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.141.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.141.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.141.up_proj.weight": 
"model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.141.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.142.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.142.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.142.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.142.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.142.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.142.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.143.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.143.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.143.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.143.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.143.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.143.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.144.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.144.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.144.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.144.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.144.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.144.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.145.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.145.down_proj.weight_scale": "model-00010-of-00092.safetensors", + 
"model.layers.9.mlp.experts.145.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.145.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.145.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.145.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.146.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.146.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.146.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.146.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.146.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.146.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.147.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.147.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.147.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.147.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.147.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.147.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.148.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.148.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.148.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.148.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.148.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.148.up_proj.weight_scale": 
"model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.149.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.149.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.149.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.149.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.149.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.149.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.15.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.15.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.15.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.15.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.15.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.15.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.150.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.150.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.150.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.150.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.150.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.150.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.151.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.151.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.151.gate_proj.weight": "model-00010-of-00092.safetensors", + 
"model.layers.9.mlp.experts.151.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.151.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.151.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.152.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.152.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.152.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.152.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.152.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.152.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.153.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.153.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.153.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.153.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.153.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.153.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.154.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.154.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.154.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.154.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.154.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.154.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.155.down_proj.weight": 
"model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.155.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.155.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.155.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.155.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.155.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.156.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.156.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.156.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.156.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.156.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.156.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.157.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.157.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.157.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.157.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.157.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.157.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.158.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.158.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.158.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.158.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + 
"model.layers.9.mlp.experts.158.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.158.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.159.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.159.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.159.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.159.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.159.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.159.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.16.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.16.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.16.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.16.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.16.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.16.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.17.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.17.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.17.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.17.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.17.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.17.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.18.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.18.down_proj.weight_scale": "model-00010-of-00092.safetensors", + 
"model.layers.9.mlp.experts.18.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.18.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.18.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.18.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.19.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.19.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.19.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.19.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.19.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.19.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.2.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.2.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.2.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.2.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.2.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.2.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.20.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.20.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.20.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.20.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.20.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.20.up_proj.weight_scale": "model-00010-of-00092.safetensors", + 
"model.layers.9.mlp.experts.21.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.21.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.21.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.21.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.21.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.21.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.22.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.22.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.22.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.22.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.22.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.22.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.23.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.23.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.23.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.23.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.23.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.23.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.24.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.24.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.24.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.24.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + 
"model.layers.9.mlp.experts.24.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.24.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.25.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.25.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.25.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.25.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.25.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.25.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.26.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.26.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.26.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.26.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.26.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.26.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.27.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.27.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.27.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.27.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.27.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.27.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.28.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.28.down_proj.weight_scale": "model-00010-of-00092.safetensors", + 
"model.layers.9.mlp.experts.28.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.28.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.28.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.28.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.29.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.29.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.29.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.29.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.29.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.29.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.3.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.3.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.3.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.3.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.3.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.3.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.30.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.30.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.30.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.30.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.30.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.30.up_proj.weight_scale": "model-00010-of-00092.safetensors", + 
"model.layers.9.mlp.experts.31.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.31.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.31.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.31.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.31.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.31.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.32.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.32.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.32.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.32.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.32.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.32.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.33.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.33.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.33.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.33.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.33.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.33.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.34.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.34.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.34.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.34.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + 
"model.layers.9.mlp.experts.34.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.34.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.35.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.35.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.35.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.35.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.35.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.35.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.36.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.36.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.36.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.36.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.36.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.36.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.37.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.37.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.37.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.37.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.37.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.37.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.38.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.38.down_proj.weight_scale": "model-00010-of-00092.safetensors", + 
"model.layers.9.mlp.experts.38.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.38.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.38.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.38.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.39.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.39.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.39.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.39.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.39.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.39.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.4.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.4.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.4.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.4.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.4.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.4.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.40.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.40.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.40.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.40.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.40.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.40.up_proj.weight_scale": "model-00010-of-00092.safetensors", + 
"model.layers.9.mlp.experts.41.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.41.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.41.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.41.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.41.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.41.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.42.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.42.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.42.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.42.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.42.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.42.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.43.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.43.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.43.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.43.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.43.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.43.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.44.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.44.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.44.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.44.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + 
"model.layers.9.mlp.experts.44.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.44.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.45.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.45.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.45.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.45.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.45.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.45.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.46.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.46.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.46.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.46.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.46.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.46.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.47.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.47.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.47.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.47.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.47.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.47.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.48.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.48.down_proj.weight_scale": "model-00010-of-00092.safetensors", + 
"model.layers.9.mlp.experts.48.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.48.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.48.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.48.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.49.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.49.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.49.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.49.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.49.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.49.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.5.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.5.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.5.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.5.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.5.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.5.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.50.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.50.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.50.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.50.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.50.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.50.up_proj.weight_scale": "model-00010-of-00092.safetensors", + 
"model.layers.9.mlp.experts.51.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.51.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.51.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.51.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.51.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.51.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.52.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.52.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.52.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.52.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.52.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.52.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.53.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.53.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.53.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.53.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.53.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.53.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.54.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.54.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.54.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.54.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + 
"model.layers.9.mlp.experts.54.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.54.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.55.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.55.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.55.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.55.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.55.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.55.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.56.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.56.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.56.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.56.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.56.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.56.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.57.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.57.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.57.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.57.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.57.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.57.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.58.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.58.down_proj.weight_scale": "model-00010-of-00092.safetensors", + 
"model.layers.9.mlp.experts.58.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.58.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.58.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.58.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.59.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.59.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.59.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.59.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.59.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.59.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.6.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.6.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.6.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.6.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.6.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.6.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.60.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.60.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.60.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.60.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.60.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.60.up_proj.weight_scale": "model-00010-of-00092.safetensors", + 
"model.layers.9.mlp.experts.61.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.61.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.61.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.61.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.61.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.61.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.62.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.62.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.62.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.62.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.62.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.62.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.63.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.63.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.63.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.63.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.63.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.63.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.64.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.64.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.64.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.64.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + 
"model.layers.9.mlp.experts.64.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.64.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.65.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.65.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.65.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.65.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.65.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.65.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.66.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.66.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.66.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.66.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.66.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.66.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.67.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.67.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.67.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.67.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.67.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.67.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.68.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.68.down_proj.weight_scale": "model-00010-of-00092.safetensors", + 
"model.layers.9.mlp.experts.68.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.68.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.68.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.68.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.69.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.69.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.69.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.69.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.69.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.69.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.7.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.7.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.7.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.7.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.7.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.7.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.70.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.70.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.70.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.70.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.70.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.70.up_proj.weight_scale": "model-00010-of-00092.safetensors", + 
"model.layers.9.mlp.experts.71.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.71.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.71.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.71.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.71.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.71.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.72.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.72.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.72.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.72.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.72.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.72.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.73.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.73.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.73.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.73.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.73.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.73.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.74.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.74.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.74.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.74.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + 
"model.layers.9.mlp.experts.74.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.74.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.75.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.75.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.75.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.75.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.75.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.75.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.76.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.76.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.76.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.76.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.76.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.76.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.77.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.77.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.77.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.77.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.77.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.77.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.78.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.78.down_proj.weight_scale": "model-00010-of-00092.safetensors", + 
"model.layers.9.mlp.experts.78.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.78.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.78.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.78.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.79.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.79.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.79.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.79.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.79.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.79.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.8.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.8.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.8.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.8.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.8.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.8.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.80.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.80.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.80.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.80.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.80.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.80.up_proj.weight_scale": "model-00010-of-00092.safetensors", + 
"model.layers.9.mlp.experts.81.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.81.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.81.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.81.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.81.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.81.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.82.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.82.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.82.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.82.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.82.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.82.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.83.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.83.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.83.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.83.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.83.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.83.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.84.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.84.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.84.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.84.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + 
"model.layers.9.mlp.experts.84.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.84.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.85.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.85.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.85.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.85.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.85.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.85.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.86.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.86.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.86.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.86.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.86.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.86.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.87.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.87.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.87.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.87.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.87.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.87.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.88.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.88.down_proj.weight_scale": "model-00010-of-00092.safetensors", + 
"model.layers.9.mlp.experts.88.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.88.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.88.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.88.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.89.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.89.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.89.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.89.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.89.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.89.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.9.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.9.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.9.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.9.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.9.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.9.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.90.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.90.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.90.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.90.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.90.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.90.up_proj.weight_scale": "model-00010-of-00092.safetensors", + 
"model.layers.9.mlp.experts.91.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.91.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.91.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.91.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.91.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.91.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.92.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.92.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.92.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.92.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.92.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.92.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.93.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.93.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.93.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.93.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.93.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.93.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.94.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.94.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.94.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.94.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + 
"model.layers.9.mlp.experts.94.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.94.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.95.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.95.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.95.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.95.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.95.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.95.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.96.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.96.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.96.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.96.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.96.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.96.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.97.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.97.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.97.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.97.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.97.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.97.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.98.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.98.down_proj.weight_scale": "model-00010-of-00092.safetensors", + 
"model.layers.9.mlp.experts.98.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.98.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.98.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.98.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.99.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.99.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.99.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.99.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.99.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.experts.99.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.gate.e_score_correction_bias": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.gate.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.shared_experts.down_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.shared_experts.down_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.shared_experts.gate_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.shared_experts.gate_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.shared_experts.up_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.mlp.shared_experts.up_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.post_attention_layernorm.weight": "model-00010-of-00092.safetensors", + "model.layers.9.self_attn.k_norm.weight": "model-00010-of-00092.safetensors", + "model.layers.9.self_attn.k_proj.bias": "model-00010-of-00092.safetensors", + "model.layers.9.self_attn.k_proj.weight": "model-00010-of-00092.safetensors", + 
"model.layers.9.self_attn.k_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.self_attn.o_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.self_attn.o_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.self_attn.q_norm.weight": "model-00010-of-00092.safetensors", + "model.layers.9.self_attn.q_proj.bias": "model-00010-of-00092.safetensors", + "model.layers.9.self_attn.q_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.self_attn.q_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.9.self_attn.v_proj.bias": "model-00010-of-00092.safetensors", + "model.layers.9.self_attn.v_proj.weight": "model-00010-of-00092.safetensors", + "model.layers.9.self_attn.v_proj.weight_scale": "model-00010-of-00092.safetensors", + "model.layers.10.input_layernorm.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.0.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.0.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.0.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.0.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.0.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.0.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.1.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.1.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.1.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.1.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.1.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.1.up_proj.weight_scale": "model-00011-of-00092.safetensors", + 
"model.layers.10.mlp.experts.10.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.10.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.10.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.10.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.10.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.10.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.100.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.100.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.100.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.100.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.100.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.100.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.101.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.101.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.101.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.101.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.101.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.101.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.102.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.102.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.102.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.102.gate_proj.weight_scale": 
"model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.102.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.102.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.103.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.103.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.103.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.103.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.103.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.103.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.104.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.104.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.104.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.104.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.104.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.104.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.105.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.105.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.105.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.105.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.105.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.105.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.106.down_proj.weight": "model-00011-of-00092.safetensors", + 
"model.layers.10.mlp.experts.106.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.106.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.106.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.106.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.106.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.107.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.107.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.107.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.107.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.107.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.107.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.108.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.108.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.108.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.108.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.108.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.108.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.109.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.109.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.109.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.109.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.109.up_proj.weight": 
"model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.109.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.11.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.11.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.11.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.11.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.11.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.11.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.110.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.110.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.110.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.110.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.110.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.110.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.111.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.111.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.111.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.111.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.111.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.111.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.112.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.112.down_proj.weight_scale": "model-00011-of-00092.safetensors", + 
"model.layers.10.mlp.experts.112.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.112.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.112.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.112.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.113.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.113.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.113.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.113.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.113.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.113.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.114.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.114.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.114.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.114.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.114.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.114.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.115.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.115.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.115.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.115.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.115.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.115.up_proj.weight_scale": 
"model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.116.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.116.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.116.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.116.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.116.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.116.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.117.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.117.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.117.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.117.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.117.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.117.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.118.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.118.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.118.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.118.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.118.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.118.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.119.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.119.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.119.gate_proj.weight": "model-00011-of-00092.safetensors", + 
"model.layers.10.mlp.experts.119.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.119.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.119.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.12.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.12.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.12.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.12.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.12.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.12.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.120.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.120.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.120.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.120.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.120.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.120.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.121.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.121.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.121.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.121.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.121.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.121.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.122.down_proj.weight": 
"model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.122.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.122.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.122.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.122.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.122.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.123.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.123.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.123.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.123.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.123.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.123.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.124.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.124.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.124.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.124.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.124.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.124.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.125.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.125.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.125.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.125.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + 
"model.layers.10.mlp.experts.125.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.125.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.126.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.126.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.126.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.126.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.126.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.126.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.127.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.127.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.127.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.127.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.127.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.127.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.128.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.128.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.128.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.128.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.128.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.128.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.129.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.129.down_proj.weight_scale": 
"model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.129.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.129.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.129.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.129.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.13.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.13.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.13.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.13.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.13.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.13.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.130.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.130.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.130.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.130.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.130.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.130.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.131.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.131.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.131.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.131.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.131.up_proj.weight": "model-00011-of-00092.safetensors", + 
"model.layers.10.mlp.experts.131.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.132.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.132.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.132.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.132.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.132.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.132.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.133.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.133.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.133.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.133.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.133.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.133.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.134.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.134.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.134.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.134.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.134.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.134.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.135.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.135.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.135.gate_proj.weight": 
"model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.135.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.135.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.135.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.136.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.136.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.136.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.136.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.136.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.136.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.137.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.137.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.137.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.137.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.137.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.137.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.138.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.138.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.138.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.138.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.138.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.138.up_proj.weight_scale": "model-00011-of-00092.safetensors", + 
"model.layers.10.mlp.experts.139.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.139.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.139.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.139.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.139.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.139.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.14.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.14.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.14.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.14.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.14.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.14.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.140.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.140.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.140.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.140.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.140.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.140.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.141.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.141.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.141.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.141.gate_proj.weight_scale": 
"model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.141.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.141.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.142.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.142.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.142.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.142.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.142.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.142.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.143.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.143.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.143.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.143.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.143.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.143.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.144.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.144.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.144.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.144.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.144.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.144.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.145.down_proj.weight": "model-00011-of-00092.safetensors", + 
"model.layers.10.mlp.experts.145.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.145.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.145.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.145.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.145.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.146.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.146.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.146.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.146.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.146.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.146.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.147.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.147.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.147.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.147.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.147.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.147.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.148.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.148.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.148.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.148.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.148.up_proj.weight": 
"model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.148.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.149.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.149.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.149.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.149.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.149.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.149.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.15.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.15.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.15.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.15.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.15.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.15.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.150.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.150.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.150.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.150.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.150.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.150.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.151.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.151.down_proj.weight_scale": "model-00011-of-00092.safetensors", + 
"model.layers.10.mlp.experts.151.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.151.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.151.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.151.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.152.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.152.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.152.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.152.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.152.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.152.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.153.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.153.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.153.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.153.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.153.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.153.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.154.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.154.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.154.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.154.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.154.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.154.up_proj.weight_scale": 
"model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.155.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.155.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.155.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.155.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.155.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.155.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.156.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.156.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.156.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.156.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.156.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.156.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.157.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.157.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.157.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.157.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.157.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.157.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.158.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.158.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.158.gate_proj.weight": "model-00011-of-00092.safetensors", + 
"model.layers.10.mlp.experts.158.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.158.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.158.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.159.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.159.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.159.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.159.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.159.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.159.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.16.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.16.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.16.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.16.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.16.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.16.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.17.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.17.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.17.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.17.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.17.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.17.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.18.down_proj.weight": 
"model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.18.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.18.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.18.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.18.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.18.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.19.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.19.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.19.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.19.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.19.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.19.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.2.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.2.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.2.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.2.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.2.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.2.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.20.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.20.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.20.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.20.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + 
"model.layers.10.mlp.experts.20.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.20.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.21.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.21.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.21.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.21.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.21.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.21.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.22.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.22.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.22.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.22.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.22.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.22.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.23.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.23.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.23.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.23.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.23.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.23.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.24.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.24.down_proj.weight_scale": 
"model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.24.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.24.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.24.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.24.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.25.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.25.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.25.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.25.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.25.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.25.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.26.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.26.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.26.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.26.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.26.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.26.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.27.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.27.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.27.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.27.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.27.up_proj.weight": "model-00011-of-00092.safetensors", + 
"model.layers.10.mlp.experts.27.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.28.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.28.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.28.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.28.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.28.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.28.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.29.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.29.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.29.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.29.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.29.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.29.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.3.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.3.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.3.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.3.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.3.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.3.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.30.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.30.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.30.gate_proj.weight": 
"model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.30.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.30.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.30.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.31.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.31.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.31.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.31.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.31.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.31.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.32.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.32.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.32.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.32.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.32.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.32.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.33.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.33.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.33.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.33.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.33.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.33.up_proj.weight_scale": "model-00011-of-00092.safetensors", + 
"model.layers.10.mlp.experts.34.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.34.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.34.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.34.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.34.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.34.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.35.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.35.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.35.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.35.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.35.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.35.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.36.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.36.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.36.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.36.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.36.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.36.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.37.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.37.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.37.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.37.gate_proj.weight_scale": 
"model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.37.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.37.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.38.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.38.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.38.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.38.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.38.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.38.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.39.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.39.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.39.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.39.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.39.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.39.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.4.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.4.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.4.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.4.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.4.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.4.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.40.down_proj.weight": "model-00011-of-00092.safetensors", + 
"model.layers.10.mlp.experts.40.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.40.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.40.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.40.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.40.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.41.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.41.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.41.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.41.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.41.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.41.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.42.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.42.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.42.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.42.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.42.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.42.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.43.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.43.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.43.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.43.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.43.up_proj.weight": 
"model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.43.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.44.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.44.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.44.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.44.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.44.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.44.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.45.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.45.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.45.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.45.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.45.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.45.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.46.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.46.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.46.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.46.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.46.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.46.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.47.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.47.down_proj.weight_scale": "model-00011-of-00092.safetensors", + 
"model.layers.10.mlp.experts.47.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.47.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.47.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.47.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.48.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.48.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.48.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.48.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.48.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.48.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.49.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.49.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.49.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.49.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.49.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.49.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.5.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.5.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.5.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.5.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.5.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.5.up_proj.weight_scale": "model-00011-of-00092.safetensors", 
+ "model.layers.10.mlp.experts.50.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.50.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.50.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.50.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.50.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.50.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.51.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.51.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.51.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.51.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.51.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.51.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.52.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.52.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.52.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.52.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.52.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.52.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.53.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.53.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.53.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.53.gate_proj.weight_scale": 
"model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.53.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.53.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.54.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.54.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.54.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.54.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.54.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.54.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.55.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.55.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.55.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.55.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.55.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.55.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.56.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.56.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.56.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.56.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.56.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.56.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.57.down_proj.weight": "model-00011-of-00092.safetensors", + 
"model.layers.10.mlp.experts.57.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.57.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.57.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.57.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.57.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.58.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.58.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.58.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.58.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.58.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.58.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.59.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.59.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.59.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.59.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.59.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.59.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.6.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.6.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.6.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.6.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.6.up_proj.weight": 
"model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.6.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.60.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.60.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.60.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.60.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.60.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.60.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.61.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.61.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.61.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.61.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.61.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.61.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.62.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.62.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.62.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.62.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.62.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.62.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.63.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.63.down_proj.weight_scale": "model-00011-of-00092.safetensors", + 
"model.layers.10.mlp.experts.63.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.63.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.63.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.63.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.64.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.64.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.64.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.64.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.64.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.64.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.65.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.65.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.65.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.65.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.65.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.65.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.66.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.66.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.66.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.66.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.66.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.66.up_proj.weight_scale": 
"model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.67.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.67.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.67.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.67.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.67.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.67.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.68.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.68.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.68.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.68.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.68.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.68.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.69.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.69.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.69.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.69.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.69.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.69.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.7.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.7.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.7.gate_proj.weight": "model-00011-of-00092.safetensors", + 
"model.layers.10.mlp.experts.7.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.7.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.7.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.70.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.70.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.70.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.70.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.70.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.70.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.71.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.71.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.71.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.71.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.71.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.71.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.72.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.72.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.72.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.72.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.72.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.72.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.73.down_proj.weight": 
"model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.73.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.73.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.73.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.73.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.73.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.74.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.74.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.74.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.74.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.74.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.74.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.75.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.75.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.75.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.75.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.75.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.75.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.76.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.76.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.76.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.76.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + 
"model.layers.10.mlp.experts.76.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.76.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.77.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.77.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.77.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.77.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.77.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.77.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.78.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.78.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.78.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.78.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.78.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.78.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.79.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.79.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.79.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.79.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.79.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.79.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.8.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.8.down_proj.weight_scale": 
"model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.8.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.8.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.8.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.8.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.80.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.80.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.80.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.80.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.80.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.80.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.81.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.81.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.81.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.81.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.81.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.81.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.82.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.82.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.82.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.82.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.82.up_proj.weight": "model-00011-of-00092.safetensors", + 
"model.layers.10.mlp.experts.82.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.83.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.83.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.83.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.83.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.83.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.83.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.84.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.84.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.84.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.84.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.84.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.84.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.85.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.85.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.85.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.85.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.85.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.85.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.86.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.86.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.86.gate_proj.weight": 
"model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.86.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.86.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.86.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.87.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.87.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.87.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.87.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.87.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.87.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.88.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.88.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.88.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.88.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.88.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.88.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.89.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.89.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.89.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.89.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.89.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.89.up_proj.weight_scale": "model-00011-of-00092.safetensors", + 
"model.layers.10.mlp.experts.9.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.9.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.9.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.9.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.9.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.9.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.90.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.90.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.90.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.90.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.90.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.90.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.91.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.91.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.91.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.91.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.91.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.91.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.92.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.92.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.92.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.92.gate_proj.weight_scale": 
"model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.92.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.92.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.93.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.93.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.93.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.93.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.93.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.93.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.94.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.94.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.94.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.94.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.94.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.94.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.95.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.95.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.95.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.95.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.95.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.95.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.96.down_proj.weight": "model-00011-of-00092.safetensors", + 
"model.layers.10.mlp.experts.96.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.96.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.96.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.96.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.96.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.97.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.97.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.97.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.97.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.97.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.97.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.98.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.98.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.98.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.98.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.98.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.98.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.99.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.99.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.99.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.99.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.99.up_proj.weight": 
"model-00011-of-00092.safetensors", + "model.layers.10.mlp.experts.99.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.gate.e_score_correction_bias": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.gate.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.shared_experts.down_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.shared_experts.down_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.shared_experts.gate_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.shared_experts.gate_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.shared_experts.up_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.mlp.shared_experts.up_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.post_attention_layernorm.weight": "model-00011-of-00092.safetensors", + "model.layers.10.self_attn.k_norm.weight": "model-00011-of-00092.safetensors", + "model.layers.10.self_attn.k_proj.bias": "model-00011-of-00092.safetensors", + "model.layers.10.self_attn.k_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.self_attn.k_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.self_attn.o_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.self_attn.o_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.self_attn.q_norm.weight": "model-00011-of-00092.safetensors", + "model.layers.10.self_attn.q_proj.bias": "model-00011-of-00092.safetensors", + "model.layers.10.self_attn.q_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.self_attn.q_proj.weight_scale": "model-00011-of-00092.safetensors", + "model.layers.10.self_attn.v_proj.bias": "model-00011-of-00092.safetensors", + "model.layers.10.self_attn.v_proj.weight": "model-00011-of-00092.safetensors", + "model.layers.10.self_attn.v_proj.weight_scale": 
"model-00011-of-00092.safetensors", + "model.layers.11.input_layernorm.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.0.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.0.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.0.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.0.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.0.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.0.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.1.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.1.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.1.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.1.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.1.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.1.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.10.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.10.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.10.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.10.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.10.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.10.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.100.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.100.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.100.gate_proj.weight": 
"model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.100.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.100.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.100.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.101.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.101.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.101.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.101.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.101.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.101.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.102.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.102.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.102.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.102.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.102.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.102.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.103.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.103.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.103.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.103.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.103.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.103.up_proj.weight_scale": "model-00012-of-00092.safetensors", + 
"model.layers.11.mlp.experts.104.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.104.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.104.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.104.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.104.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.104.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.105.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.105.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.105.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.105.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.105.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.105.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.106.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.106.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.106.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.106.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.106.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.106.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.107.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.107.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.107.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.107.gate_proj.weight_scale": 
"model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.107.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.107.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.108.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.108.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.108.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.108.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.108.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.108.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.109.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.109.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.109.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.109.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.109.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.109.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.11.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.11.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.11.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.11.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.11.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.11.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.110.down_proj.weight": "model-00012-of-00092.safetensors", + 
"model.layers.11.mlp.experts.110.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.110.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.110.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.110.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.110.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.111.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.111.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.111.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.111.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.111.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.111.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.112.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.112.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.112.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.112.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.112.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.112.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.113.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.113.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.113.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.113.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.113.up_proj.weight": 
"model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.113.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.114.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.114.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.114.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.114.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.114.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.114.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.115.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.115.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.115.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.115.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.115.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.115.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.116.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.116.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.116.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.116.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.116.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.116.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.117.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.117.down_proj.weight_scale": "model-00012-of-00092.safetensors", + 
"model.layers.11.mlp.experts.117.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.117.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.117.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.117.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.118.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.118.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.118.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.118.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.118.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.118.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.119.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.119.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.119.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.119.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.119.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.119.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.12.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.12.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.12.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.12.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.12.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.12.up_proj.weight_scale": 
"model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.120.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.120.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.120.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.120.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.120.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.120.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.121.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.121.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.121.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.121.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.121.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.121.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.122.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.122.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.122.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.122.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.122.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.122.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.123.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.123.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.123.gate_proj.weight": "model-00012-of-00092.safetensors", + 
"model.layers.11.mlp.experts.123.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.123.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.123.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.124.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.124.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.124.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.124.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.124.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.124.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.125.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.125.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.125.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.125.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.125.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.125.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.126.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.126.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.126.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.126.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.126.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.126.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.127.down_proj.weight": 
"model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.127.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.127.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.127.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.127.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.127.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.128.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.128.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.128.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.128.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.128.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.128.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.129.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.129.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.129.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.129.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.129.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.129.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.13.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.13.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.13.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.13.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + 
"model.layers.11.mlp.experts.13.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.13.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.130.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.130.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.130.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.130.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.130.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.130.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.131.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.131.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.131.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.131.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.131.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.131.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.132.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.132.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.132.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.132.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.132.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.132.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.133.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.133.down_proj.weight_scale": 
"model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.133.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.133.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.133.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.133.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.134.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.134.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.134.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.134.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.134.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.134.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.135.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.135.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.135.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.135.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.135.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.135.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.136.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.136.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.136.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.136.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.136.up_proj.weight": "model-00012-of-00092.safetensors", + 
"model.layers.11.mlp.experts.136.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.137.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.137.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.137.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.137.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.137.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.137.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.138.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.138.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.138.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.138.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.138.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.138.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.139.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.139.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.139.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.139.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.139.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.139.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.14.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.14.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.14.gate_proj.weight": 
"model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.14.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.14.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.14.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.140.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.140.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.140.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.140.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.140.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.140.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.141.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.141.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.141.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.141.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.141.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.141.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.142.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.142.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.142.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.142.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.142.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.142.up_proj.weight_scale": "model-00012-of-00092.safetensors", + 
"model.layers.11.mlp.experts.143.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.143.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.143.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.143.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.143.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.143.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.144.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.144.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.144.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.144.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.144.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.144.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.145.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.145.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.145.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.145.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.145.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.145.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.146.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.146.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.146.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.146.gate_proj.weight_scale": 
"model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.146.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.146.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.147.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.147.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.147.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.147.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.147.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.147.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.148.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.148.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.148.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.148.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.148.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.148.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.149.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.149.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.149.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.149.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.149.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.149.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.15.down_proj.weight": "model-00012-of-00092.safetensors", + 
"model.layers.11.mlp.experts.15.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.15.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.15.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.15.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.15.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.150.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.150.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.150.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.150.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.150.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.150.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.151.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.151.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.151.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.151.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.151.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.151.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.152.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.152.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.152.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.152.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.152.up_proj.weight": 
"model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.152.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.153.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.153.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.153.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.153.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.153.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.153.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.154.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.154.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.154.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.154.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.154.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.154.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.155.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.155.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.155.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.155.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.155.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.155.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.156.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.156.down_proj.weight_scale": "model-00012-of-00092.safetensors", + 
"model.layers.11.mlp.experts.156.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.156.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.156.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.156.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.157.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.157.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.157.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.157.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.157.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.157.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.158.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.158.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.158.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.158.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.158.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.158.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.159.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.159.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.159.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.159.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.159.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.159.up_proj.weight_scale": 
"model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.16.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.16.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.16.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.16.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.16.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.16.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.17.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.17.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.17.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.17.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.17.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.17.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.18.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.18.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.18.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.18.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.18.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.18.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.19.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.19.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.19.gate_proj.weight": "model-00012-of-00092.safetensors", + 
"model.layers.11.mlp.experts.19.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.19.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.19.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.2.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.2.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.2.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.2.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.2.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.2.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.20.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.20.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.20.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.20.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.20.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.20.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.21.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.21.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.21.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.21.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.21.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.21.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.22.down_proj.weight": "model-00012-of-00092.safetensors", 
+ "model.layers.11.mlp.experts.22.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.22.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.22.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.22.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.22.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.23.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.23.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.23.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.23.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.23.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.23.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.24.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.24.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.24.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.24.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.24.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.24.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.25.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.25.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.25.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.25.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.25.up_proj.weight": 
"model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.25.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.26.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.26.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.26.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.26.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.26.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.26.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.27.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.27.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.27.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.27.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.27.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.27.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.28.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.28.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.28.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.28.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.28.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.28.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.29.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.29.down_proj.weight_scale": "model-00012-of-00092.safetensors", + 
"model.layers.11.mlp.experts.29.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.29.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.29.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.29.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.3.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.3.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.3.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.3.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.3.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.3.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.30.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.30.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.30.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.30.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.30.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.30.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.31.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.31.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.31.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.31.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.31.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.31.up_proj.weight_scale": "model-00012-of-00092.safetensors", 
+ "model.layers.11.mlp.experts.32.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.32.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.32.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.32.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.32.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.32.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.33.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.33.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.33.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.33.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.33.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.33.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.34.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.34.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.34.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.34.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.34.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.34.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.35.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.35.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.35.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.35.gate_proj.weight_scale": 
"model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.35.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.35.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.36.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.36.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.36.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.36.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.36.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.36.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.37.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.37.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.37.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.37.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.37.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.37.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.38.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.38.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.38.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.38.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.38.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.38.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.39.down_proj.weight": "model-00012-of-00092.safetensors", + 
"model.layers.11.mlp.experts.39.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.39.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.39.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.39.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.39.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.4.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.4.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.4.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.4.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.4.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.4.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.40.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.40.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.40.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.40.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.40.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.40.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.41.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.41.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.41.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.41.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.41.up_proj.weight": 
"model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.41.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.42.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.42.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.42.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.42.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.42.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.42.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.43.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.43.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.43.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.43.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.43.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.43.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.44.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.44.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.44.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.44.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.44.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.44.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.45.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.45.down_proj.weight_scale": "model-00012-of-00092.safetensors", + 
"model.layers.11.mlp.experts.45.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.45.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.45.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.45.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.46.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.46.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.46.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.46.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.46.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.46.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.47.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.47.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.47.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.47.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.47.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.47.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.48.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.48.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.48.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.48.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.48.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.48.up_proj.weight_scale": 
"model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.49.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.49.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.49.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.49.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.49.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.49.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.5.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.5.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.5.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.5.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.5.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.5.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.50.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.50.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.50.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.50.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.50.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.50.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.51.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.51.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.51.gate_proj.weight": "model-00012-of-00092.safetensors", + 
"model.layers.11.mlp.experts.51.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.51.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.51.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.52.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.52.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.52.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.52.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.52.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.52.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.53.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.53.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.53.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.53.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.53.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.53.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.54.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.54.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.54.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.54.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.54.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.54.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.55.down_proj.weight": 
"model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.55.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.55.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.55.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.55.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.55.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.56.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.56.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.56.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.56.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.56.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.56.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.57.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.57.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.57.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.57.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.57.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.57.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.58.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.58.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.58.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.58.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + 
"model.layers.11.mlp.experts.58.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.58.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.59.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.59.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.59.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.59.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.59.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.59.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.6.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.6.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.6.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.6.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.6.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.6.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.60.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.60.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.60.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.60.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.60.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.60.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.61.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.61.down_proj.weight_scale": "model-00012-of-00092.safetensors", 
+ "model.layers.11.mlp.experts.61.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.61.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.61.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.61.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.62.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.62.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.62.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.62.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.62.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.62.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.63.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.63.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.63.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.63.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.63.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.63.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.64.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.64.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.64.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.64.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.64.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.64.up_proj.weight_scale": 
"model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.65.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.65.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.65.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.65.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.65.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.65.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.66.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.66.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.66.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.66.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.66.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.66.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.67.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.67.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.67.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.67.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.67.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.67.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.68.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.68.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.68.gate_proj.weight": "model-00012-of-00092.safetensors", + 
"model.layers.11.mlp.experts.68.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.68.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.68.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.69.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.69.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.69.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.69.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.69.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.69.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.7.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.7.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.7.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.7.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.7.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.7.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.70.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.70.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.70.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.70.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.70.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.70.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.71.down_proj.weight": "model-00012-of-00092.safetensors", 
+ "model.layers.11.mlp.experts.71.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.71.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.71.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.71.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.71.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.72.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.72.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.72.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.72.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.72.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.72.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.73.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.73.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.73.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.73.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.73.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.73.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.74.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.74.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.74.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.74.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.74.up_proj.weight": 
"model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.74.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.75.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.75.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.75.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.75.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.75.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.75.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.76.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.76.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.76.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.76.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.76.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.76.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.77.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.77.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.77.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.77.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.77.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.77.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.78.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.78.down_proj.weight_scale": "model-00012-of-00092.safetensors", + 
"model.layers.11.mlp.experts.78.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.78.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.78.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.78.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.79.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.79.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.79.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.79.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.79.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.79.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.8.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.8.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.8.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.8.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.8.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.8.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.80.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.80.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.80.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.80.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.80.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.80.up_proj.weight_scale": "model-00012-of-00092.safetensors", 
+ "model.layers.11.mlp.experts.81.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.81.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.81.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.81.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.81.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.81.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.82.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.82.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.82.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.82.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.82.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.82.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.83.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.83.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.83.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.83.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.83.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.83.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.84.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.84.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.84.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.84.gate_proj.weight_scale": 
"model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.84.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.84.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.85.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.85.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.85.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.85.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.85.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.85.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.86.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.86.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.86.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.86.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.86.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.86.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.87.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.87.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.87.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.87.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.87.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.87.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.88.down_proj.weight": "model-00012-of-00092.safetensors", + 
"model.layers.11.mlp.experts.88.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.88.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.88.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.88.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.88.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.89.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.89.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.89.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.89.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.89.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.89.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.9.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.9.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.9.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.9.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.9.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.9.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.90.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.90.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.90.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.90.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.90.up_proj.weight": 
"model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.90.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.91.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.91.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.91.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.91.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.91.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.91.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.92.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.92.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.92.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.92.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.92.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.92.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.93.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.93.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.93.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.93.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.93.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.93.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.94.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.94.down_proj.weight_scale": "model-00012-of-00092.safetensors", + 
"model.layers.11.mlp.experts.94.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.94.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.94.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.94.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.95.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.95.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.95.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.95.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.95.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.95.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.96.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.96.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.96.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.96.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.96.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.96.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.97.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.97.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.97.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.97.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.97.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.97.up_proj.weight_scale": 
"model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.98.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.98.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.98.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.98.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.98.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.98.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.99.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.99.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.99.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.99.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.99.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.experts.99.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.gate.e_score_correction_bias": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.gate.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.shared_experts.down_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.shared_experts.down_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.shared_experts.gate_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.shared_experts.gate_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.shared_experts.up_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.mlp.shared_experts.up_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.post_attention_layernorm.weight": "model-00012-of-00092.safetensors", + 
"model.layers.11.self_attn.k_norm.weight": "model-00012-of-00092.safetensors", + "model.layers.11.self_attn.k_proj.bias": "model-00012-of-00092.safetensors", + "model.layers.11.self_attn.k_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.self_attn.k_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.self_attn.o_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.self_attn.o_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.self_attn.q_norm.weight": "model-00012-of-00092.safetensors", + "model.layers.11.self_attn.q_proj.bias": "model-00012-of-00092.safetensors", + "model.layers.11.self_attn.q_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.self_attn.q_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.11.self_attn.v_proj.bias": "model-00012-of-00092.safetensors", + "model.layers.11.self_attn.v_proj.weight": "model-00012-of-00092.safetensors", + "model.layers.11.self_attn.v_proj.weight_scale": "model-00012-of-00092.safetensors", + "model.layers.12.input_layernorm.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.0.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.0.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.0.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.0.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.0.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.0.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.1.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.1.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.1.gate_proj.weight": "model-00013-of-00092.safetensors", + 
"model.layers.12.mlp.experts.1.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.1.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.1.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.10.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.10.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.10.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.10.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.10.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.10.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.100.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.100.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.100.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.100.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.100.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.100.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.101.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.101.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.101.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.101.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.101.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.101.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.102.down_proj.weight": 
"model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.102.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.102.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.102.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.102.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.102.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.103.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.103.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.103.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.103.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.103.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.103.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.104.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.104.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.104.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.104.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.104.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.104.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.105.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.105.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.105.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.105.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + 
"model.layers.12.mlp.experts.105.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.105.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.106.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.106.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.106.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.106.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.106.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.106.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.107.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.107.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.107.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.107.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.107.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.107.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.108.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.108.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.108.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.108.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.108.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.108.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.109.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.109.down_proj.weight_scale": 
"model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.109.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.109.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.109.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.109.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.11.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.11.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.11.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.11.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.11.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.11.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.110.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.110.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.110.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.110.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.110.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.110.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.111.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.111.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.111.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.111.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.111.up_proj.weight": "model-00013-of-00092.safetensors", + 
"model.layers.12.mlp.experts.111.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.112.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.112.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.112.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.112.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.112.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.112.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.113.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.113.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.113.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.113.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.113.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.113.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.114.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.114.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.114.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.114.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.114.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.114.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.115.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.115.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.115.gate_proj.weight": 
"model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.115.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.115.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.115.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.116.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.116.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.116.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.116.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.116.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.116.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.117.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.117.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.117.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.117.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.117.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.117.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.118.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.118.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.118.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.118.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.118.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.118.up_proj.weight_scale": "model-00013-of-00092.safetensors", + 
"model.layers.12.mlp.experts.119.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.119.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.119.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.119.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.119.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.119.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.12.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.12.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.12.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.12.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.12.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.12.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.120.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.120.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.120.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.120.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.120.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.120.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.121.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.121.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.121.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.121.gate_proj.weight_scale": 
"model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.121.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.121.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.122.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.122.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.122.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.122.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.122.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.122.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.123.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.123.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.123.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.123.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.123.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.123.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.124.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.124.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.124.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.124.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.124.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.124.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.125.down_proj.weight": "model-00013-of-00092.safetensors", + 
"model.layers.12.mlp.experts.125.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.125.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.125.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.125.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.125.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.126.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.126.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.126.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.126.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.126.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.126.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.127.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.127.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.127.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.127.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.127.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.127.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.128.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.128.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.128.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.128.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.128.up_proj.weight": 
"model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.128.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.129.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.129.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.129.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.129.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.129.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.129.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.13.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.13.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.13.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.13.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.13.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.13.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.130.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.130.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.130.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.130.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.130.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.130.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.131.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.131.down_proj.weight_scale": "model-00013-of-00092.safetensors", + 
"model.layers.12.mlp.experts.131.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.131.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.131.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.131.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.132.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.132.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.132.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.132.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.132.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.132.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.133.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.133.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.133.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.133.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.133.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.133.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.134.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.134.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.134.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.134.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.134.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.134.up_proj.weight_scale": 
"model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.135.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.135.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.135.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.135.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.135.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.135.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.136.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.136.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.136.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.136.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.136.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.136.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.137.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.137.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.137.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.137.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.137.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.137.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.138.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.138.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.138.gate_proj.weight": "model-00013-of-00092.safetensors", + 
"model.layers.12.mlp.experts.138.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.138.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.138.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.139.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.139.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.139.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.139.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.139.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.139.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.14.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.14.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.14.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.14.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.14.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.14.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.140.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.140.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.140.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.140.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.140.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.140.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.141.down_proj.weight": 
"model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.141.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.141.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.141.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.141.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.141.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.142.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.142.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.142.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.142.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.142.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.142.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.143.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.143.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.143.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.143.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.143.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.143.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.144.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.144.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.144.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.144.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + 
"model.layers.12.mlp.experts.144.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.144.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.145.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.145.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.145.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.145.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.145.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.145.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.146.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.146.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.146.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.146.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.146.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.146.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.147.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.147.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.147.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.147.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.147.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.147.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.148.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.148.down_proj.weight_scale": 
"model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.148.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.148.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.148.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.148.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.149.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.149.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.149.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.149.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.149.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.149.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.15.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.15.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.15.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.15.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.15.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.15.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.150.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.150.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.150.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.150.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.150.up_proj.weight": "model-00013-of-00092.safetensors", + 
"model.layers.12.mlp.experts.150.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.151.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.151.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.151.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.151.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.151.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.151.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.152.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.152.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.152.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.152.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.152.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.152.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.153.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.153.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.153.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.153.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.153.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.153.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.154.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.154.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.154.gate_proj.weight": 
"model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.154.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.154.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.154.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.155.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.155.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.155.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.155.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.155.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.155.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.156.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.156.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.156.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.156.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.156.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.156.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.157.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.157.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.157.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.157.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.157.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.157.up_proj.weight_scale": "model-00013-of-00092.safetensors", + 
"model.layers.12.mlp.experts.158.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.158.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.158.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.158.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.158.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.158.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.159.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.159.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.159.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.159.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.159.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.159.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.16.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.16.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.16.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.16.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.16.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.16.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.17.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.17.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.17.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.17.gate_proj.weight_scale": 
"model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.17.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.17.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.18.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.18.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.18.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.18.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.18.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.18.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.19.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.19.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.19.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.19.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.19.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.19.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.2.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.2.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.2.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.2.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.2.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.2.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.20.down_proj.weight": "model-00013-of-00092.safetensors", + 
"model.layers.12.mlp.experts.20.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.20.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.20.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.20.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.20.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.21.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.21.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.21.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.21.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.21.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.21.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.22.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.22.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.22.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.22.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.22.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.22.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.23.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.23.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.23.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.23.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.23.up_proj.weight": 
"model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.23.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.24.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.24.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.24.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.24.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.24.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.24.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.25.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.25.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.25.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.25.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.25.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.25.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.26.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.26.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.26.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.26.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.26.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.26.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.27.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.27.down_proj.weight_scale": "model-00013-of-00092.safetensors", + 
"model.layers.12.mlp.experts.27.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.27.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.27.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.27.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.28.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.28.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.28.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.28.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.28.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.28.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.29.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.29.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.29.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.29.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.29.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.29.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.3.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.3.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.3.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.3.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.3.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.3.up_proj.weight_scale": "model-00013-of-00092.safetensors", 
+ "model.layers.12.mlp.experts.30.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.30.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.30.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.30.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.30.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.30.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.31.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.31.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.31.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.31.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.31.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.31.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.32.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.32.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.32.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.32.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.32.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.32.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.33.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.33.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.33.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.33.gate_proj.weight_scale": 
"model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.33.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.33.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.34.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.34.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.34.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.34.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.34.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.34.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.35.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.35.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.35.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.35.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.35.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.35.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.36.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.36.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.36.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.36.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.36.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.36.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.37.down_proj.weight": "model-00013-of-00092.safetensors", + 
"model.layers.12.mlp.experts.37.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.37.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.37.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.37.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.37.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.38.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.38.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.38.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.38.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.38.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.38.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.39.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.39.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.39.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.39.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.39.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.39.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.4.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.4.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.4.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.4.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.4.up_proj.weight": 
"model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.4.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.40.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.40.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.40.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.40.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.40.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.40.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.41.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.41.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.41.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.41.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.41.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.41.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.42.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.42.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.42.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.42.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.42.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.42.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.43.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.43.down_proj.weight_scale": "model-00013-of-00092.safetensors", + 
"model.layers.12.mlp.experts.43.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.43.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.43.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.43.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.44.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.44.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.44.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.44.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.44.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.44.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.45.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.45.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.45.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.45.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.45.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.45.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.46.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.46.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.46.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.46.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.46.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.46.up_proj.weight_scale": 
"model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.47.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.47.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.47.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.47.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.47.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.47.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.48.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.48.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.48.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.48.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.48.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.48.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.49.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.49.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.49.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.49.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.49.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.49.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.5.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.5.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.5.gate_proj.weight": "model-00013-of-00092.safetensors", + 
"model.layers.12.mlp.experts.5.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.5.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.5.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.50.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.50.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.50.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.50.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.50.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.50.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.51.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.51.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.51.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.51.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.51.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.51.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.52.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.52.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.52.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.52.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.52.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.52.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.53.down_proj.weight": 
"model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.53.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.53.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.53.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.53.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.53.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.54.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.54.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.54.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.54.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.54.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.54.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.55.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.55.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.55.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.55.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.55.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.55.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.56.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.56.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.56.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.56.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + 
"model.layers.12.mlp.experts.56.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.56.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.57.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.57.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.57.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.57.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.57.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.57.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.58.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.58.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.58.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.58.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.58.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.58.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.59.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.59.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.59.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.59.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.59.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.59.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.6.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.6.down_proj.weight_scale": 
"model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.6.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.6.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.6.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.6.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.60.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.60.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.60.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.60.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.60.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.60.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.61.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.61.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.61.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.61.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.61.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.61.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.62.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.62.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.62.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.62.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.62.up_proj.weight": "model-00013-of-00092.safetensors", + 
"model.layers.12.mlp.experts.62.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.63.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.63.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.63.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.63.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.63.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.63.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.64.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.64.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.64.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.64.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.64.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.64.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.65.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.65.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.65.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.65.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.65.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.65.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.66.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.66.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.66.gate_proj.weight": 
"model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.66.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.66.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.66.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.67.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.67.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.67.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.67.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.67.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.67.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.68.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.68.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.68.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.68.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.68.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.68.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.69.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.69.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.69.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.69.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.69.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.69.up_proj.weight_scale": "model-00013-of-00092.safetensors", + 
"model.layers.12.mlp.experts.7.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.7.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.7.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.7.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.7.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.7.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.70.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.70.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.70.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.70.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.70.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.70.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.71.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.71.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.71.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.71.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.71.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.71.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.72.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.72.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.72.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.72.gate_proj.weight_scale": 
"model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.72.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.72.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.73.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.73.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.73.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.73.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.73.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.73.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.74.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.74.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.74.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.74.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.74.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.74.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.75.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.75.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.75.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.75.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.75.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.75.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.76.down_proj.weight": "model-00013-of-00092.safetensors", + 
"model.layers.12.mlp.experts.76.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.76.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.76.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.76.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.76.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.77.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.77.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.77.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.77.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.77.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.77.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.78.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.78.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.78.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.78.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.78.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.78.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.79.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.79.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.79.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.79.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.79.up_proj.weight": 
"model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.79.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.8.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.8.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.8.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.8.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.8.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.8.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.80.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.80.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.80.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.80.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.80.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.80.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.81.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.81.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.81.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.81.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.81.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.81.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.82.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.82.down_proj.weight_scale": "model-00013-of-00092.safetensors", + 
"model.layers.12.mlp.experts.82.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.82.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.82.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.82.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.83.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.83.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.83.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.83.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.83.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.83.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.84.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.84.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.84.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.84.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.84.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.84.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.85.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.85.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.85.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.85.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.85.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.85.up_proj.weight_scale": 
"model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.86.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.86.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.86.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.86.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.86.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.86.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.87.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.87.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.87.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.87.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.87.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.87.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.88.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.88.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.88.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.88.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.88.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.88.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.89.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.89.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.89.gate_proj.weight": "model-00013-of-00092.safetensors", + 
"model.layers.12.mlp.experts.89.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.89.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.89.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.9.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.9.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.9.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.9.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.9.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.9.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.90.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.90.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.90.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.90.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.90.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.90.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.91.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.91.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.91.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.91.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.91.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.91.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.92.down_proj.weight": "model-00013-of-00092.safetensors", 
+ "model.layers.12.mlp.experts.92.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.92.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.92.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.92.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.92.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.93.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.93.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.93.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.93.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.93.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.93.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.94.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.94.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.94.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.94.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.94.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.94.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.95.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.95.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.95.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.95.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.95.up_proj.weight": 
"model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.95.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.96.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.96.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.96.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.96.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.96.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.96.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.97.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.97.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.97.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.97.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.97.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.97.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.98.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.98.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.98.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.98.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.98.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.98.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.99.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.99.down_proj.weight_scale": "model-00013-of-00092.safetensors", + 
"model.layers.12.mlp.experts.99.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.99.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.99.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.experts.99.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.gate.e_score_correction_bias": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.gate.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.shared_experts.down_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.shared_experts.down_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.shared_experts.gate_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.shared_experts.gate_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.shared_experts.up_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.mlp.shared_experts.up_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.post_attention_layernorm.weight": "model-00013-of-00092.safetensors", + "model.layers.12.self_attn.k_norm.weight": "model-00013-of-00092.safetensors", + "model.layers.12.self_attn.k_proj.bias": "model-00013-of-00092.safetensors", + "model.layers.12.self_attn.k_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.self_attn.k_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.self_attn.o_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.self_attn.o_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.12.self_attn.q_norm.weight": "model-00013-of-00092.safetensors", + "model.layers.12.self_attn.q_proj.bias": "model-00013-of-00092.safetensors", + "model.layers.12.self_attn.q_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.self_attn.q_proj.weight_scale": 
"model-00013-of-00092.safetensors", + "model.layers.12.self_attn.v_proj.bias": "model-00013-of-00092.safetensors", + "model.layers.12.self_attn.v_proj.weight": "model-00013-of-00092.safetensors", + "model.layers.12.self_attn.v_proj.weight_scale": "model-00013-of-00092.safetensors", + "model.layers.13.input_layernorm.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.0.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.0.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.0.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.0.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.0.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.0.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.1.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.1.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.1.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.1.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.1.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.1.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.10.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.10.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.10.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.10.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.10.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.10.up_proj.weight_scale": "model-00014-of-00092.safetensors", + 
"model.layers.13.mlp.experts.100.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.100.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.100.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.100.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.100.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.100.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.101.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.101.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.101.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.101.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.101.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.101.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.102.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.102.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.102.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.102.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.102.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.102.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.103.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.103.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.103.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.103.gate_proj.weight_scale": 
"model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.103.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.103.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.104.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.104.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.104.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.104.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.104.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.104.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.105.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.105.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.105.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.105.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.105.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.105.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.106.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.106.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.106.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.106.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.106.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.106.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.107.down_proj.weight": "model-00014-of-00092.safetensors", + 
"model.layers.13.mlp.experts.107.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.107.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.107.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.107.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.107.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.108.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.108.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.108.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.108.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.108.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.108.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.109.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.109.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.109.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.109.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.109.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.109.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.11.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.11.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.11.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.11.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.11.up_proj.weight": 
"model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.11.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.110.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.110.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.110.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.110.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.110.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.110.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.111.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.111.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.111.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.111.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.111.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.111.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.112.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.112.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.112.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.112.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.112.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.112.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.113.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.113.down_proj.weight_scale": "model-00014-of-00092.safetensors", + 
"model.layers.13.mlp.experts.113.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.113.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.113.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.113.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.114.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.114.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.114.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.114.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.114.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.114.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.115.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.115.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.115.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.115.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.115.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.115.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.116.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.116.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.116.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.116.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.116.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.116.up_proj.weight_scale": 
"model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.117.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.117.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.117.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.117.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.117.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.117.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.118.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.118.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.118.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.118.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.118.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.118.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.119.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.119.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.119.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.119.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.119.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.119.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.12.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.12.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.12.gate_proj.weight": "model-00014-of-00092.safetensors", + 
"model.layers.13.mlp.experts.12.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.12.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.12.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.120.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.120.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.120.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.120.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.120.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.120.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.121.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.121.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.121.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.121.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.121.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.121.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.122.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.122.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.122.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.122.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.122.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.122.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.123.down_proj.weight": 
"model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.123.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.123.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.123.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.123.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.123.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.124.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.124.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.124.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.124.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.124.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.124.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.125.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.125.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.125.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.125.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.125.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.125.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.126.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.126.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.126.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.126.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + 
"model.layers.13.mlp.experts.126.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.126.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.127.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.127.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.127.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.127.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.127.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.127.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.128.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.128.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.128.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.128.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.128.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.128.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.129.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.129.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.129.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.129.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.129.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.129.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.13.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.13.down_proj.weight_scale": 
"model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.13.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.13.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.13.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.13.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.130.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.130.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.130.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.130.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.130.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.130.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.131.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.131.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.131.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.131.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.131.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.131.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.132.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.132.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.132.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.132.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.132.up_proj.weight": "model-00014-of-00092.safetensors", + 
"model.layers.13.mlp.experts.132.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.133.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.133.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.133.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.133.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.133.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.133.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.134.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.134.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.134.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.134.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.134.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.134.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.135.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.135.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.135.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.135.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.135.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.135.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.136.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.136.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.136.gate_proj.weight": 
"model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.136.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.136.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.136.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.137.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.137.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.137.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.137.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.137.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.137.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.138.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.138.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.138.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.138.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.138.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.138.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.139.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.139.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.139.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.139.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.139.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.139.up_proj.weight_scale": "model-00014-of-00092.safetensors", + 
"model.layers.13.mlp.experts.14.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.14.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.14.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.14.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.14.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.14.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.140.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.140.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.140.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.140.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.140.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.140.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.141.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.141.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.141.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.141.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.141.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.141.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.142.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.142.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.142.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.142.gate_proj.weight_scale": 
"model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.142.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.142.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.143.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.143.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.143.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.143.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.143.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.143.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.144.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.144.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.144.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.144.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.144.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.144.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.145.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.145.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.145.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.145.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.145.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.145.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.146.down_proj.weight": "model-00014-of-00092.safetensors", + 
"model.layers.13.mlp.experts.146.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.146.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.146.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.146.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.146.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.147.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.147.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.147.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.147.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.147.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.147.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.148.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.148.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.148.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.148.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.148.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.148.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.149.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.149.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.149.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.149.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.149.up_proj.weight": 
"model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.149.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.15.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.15.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.15.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.15.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.15.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.15.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.150.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.150.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.150.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.150.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.150.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.150.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.151.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.151.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.151.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.151.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.151.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.151.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.152.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.152.down_proj.weight_scale": "model-00014-of-00092.safetensors", + 
"model.layers.13.mlp.experts.152.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.152.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.152.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.152.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.153.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.153.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.153.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.153.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.153.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.153.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.154.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.154.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.154.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.154.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.154.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.154.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.155.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.155.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.155.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.155.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.155.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.155.up_proj.weight_scale": 
"model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.156.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.156.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.156.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.156.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.156.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.156.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.157.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.157.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.157.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.157.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.157.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.157.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.158.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.158.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.158.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.158.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.158.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.158.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.159.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.159.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.159.gate_proj.weight": "model-00014-of-00092.safetensors", + 
"model.layers.13.mlp.experts.159.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.159.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.159.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.16.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.16.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.16.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.16.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.16.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.16.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.17.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.17.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.17.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.17.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.17.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.17.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.18.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.18.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.18.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.18.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.18.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.18.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.19.down_proj.weight": 
"model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.19.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.19.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.19.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.19.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.19.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.2.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.2.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.2.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.2.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.2.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.2.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.20.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.20.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.20.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.20.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.20.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.20.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.21.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.21.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.21.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.21.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + 
"model.layers.13.mlp.experts.21.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.21.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.22.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.22.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.22.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.22.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.22.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.22.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.23.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.23.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.23.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.23.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.23.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.23.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.24.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.24.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.24.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.24.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.24.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.24.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.25.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.25.down_proj.weight_scale": 
"model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.25.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.25.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.25.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.25.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.26.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.26.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.26.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.26.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.26.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.26.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.27.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.27.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.27.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.27.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.27.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.27.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.28.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.28.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.28.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.28.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.28.up_proj.weight": "model-00014-of-00092.safetensors", + 
"model.layers.13.mlp.experts.28.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.29.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.29.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.29.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.29.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.29.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.29.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.3.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.3.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.3.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.3.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.3.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.3.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.30.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.30.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.30.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.30.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.30.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.30.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.31.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.31.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.31.gate_proj.weight": 
"model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.31.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.31.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.31.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.32.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.32.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.32.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.32.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.32.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.32.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.33.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.33.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.33.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.33.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.33.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.33.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.34.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.34.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.34.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.34.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.34.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.34.up_proj.weight_scale": "model-00014-of-00092.safetensors", + 
"model.layers.13.mlp.experts.35.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.35.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.35.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.35.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.35.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.35.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.36.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.36.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.36.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.36.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.36.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.36.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.37.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.37.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.37.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.37.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.37.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.37.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.38.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.38.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.38.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.38.gate_proj.weight_scale": 
"model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.38.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.38.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.39.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.39.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.39.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.39.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.39.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.39.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.4.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.4.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.4.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.4.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.4.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.4.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.40.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.40.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.40.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.40.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.40.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.40.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.41.down_proj.weight": "model-00014-of-00092.safetensors", + 
"model.layers.13.mlp.experts.41.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.41.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.41.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.41.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.41.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.42.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.42.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.42.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.42.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.42.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.42.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.43.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.43.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.43.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.43.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.43.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.43.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.44.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.44.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.44.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.44.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.44.up_proj.weight": 
"model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.44.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.45.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.45.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.45.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.45.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.45.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.45.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.46.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.46.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.46.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.46.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.46.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.46.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.47.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.47.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.47.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.47.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.47.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.47.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.48.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.48.down_proj.weight_scale": "model-00014-of-00092.safetensors", + 
"model.layers.13.mlp.experts.48.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.48.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.48.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.48.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.49.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.49.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.49.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.49.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.49.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.49.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.5.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.5.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.5.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.5.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.5.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.5.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.50.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.50.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.50.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.50.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.50.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.50.up_proj.weight_scale": "model-00014-of-00092.safetensors", 
+ "model.layers.13.mlp.experts.51.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.51.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.51.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.51.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.51.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.51.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.52.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.52.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.52.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.52.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.52.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.52.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.53.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.53.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.53.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.53.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.53.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.53.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.54.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.54.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.54.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.54.gate_proj.weight_scale": 
"model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.54.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.54.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.55.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.55.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.55.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.55.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.55.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.55.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.56.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.56.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.56.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.56.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.56.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.56.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.57.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.57.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.57.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.57.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.57.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.57.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.58.down_proj.weight": "model-00014-of-00092.safetensors", + 
"model.layers.13.mlp.experts.58.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.58.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.58.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.58.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.58.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.59.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.59.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.59.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.59.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.59.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.59.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.6.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.6.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.6.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.6.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.6.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.6.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.60.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.60.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.60.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.60.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.60.up_proj.weight": 
"model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.60.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.61.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.61.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.61.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.61.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.61.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.61.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.62.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.62.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.62.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.62.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.62.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.62.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.63.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.63.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.63.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.63.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.63.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.63.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.64.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.64.down_proj.weight_scale": "model-00014-of-00092.safetensors", + 
"model.layers.13.mlp.experts.64.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.64.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.64.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.64.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.65.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.65.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.65.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.65.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.65.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.65.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.66.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.66.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.66.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.66.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.66.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.66.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.67.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.67.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.67.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.67.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.67.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.67.up_proj.weight_scale": 
"model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.68.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.68.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.68.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.68.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.68.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.68.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.69.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.69.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.69.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.69.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.69.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.69.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.7.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.7.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.7.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.7.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.7.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.7.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.70.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.70.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.70.gate_proj.weight": "model-00014-of-00092.safetensors", + 
"model.layers.13.mlp.experts.70.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.70.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.70.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.71.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.71.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.71.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.71.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.71.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.71.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.72.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.72.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.72.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.72.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.72.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.72.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.73.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.73.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.73.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.73.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.73.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.73.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.74.down_proj.weight": 
"model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.74.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.74.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.74.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.74.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.74.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.75.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.75.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.75.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.75.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.75.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.75.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.76.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.76.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.76.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.76.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.76.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.76.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.77.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.77.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.77.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.77.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + 
"model.layers.13.mlp.experts.77.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.77.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.78.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.78.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.78.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.78.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.78.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.78.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.79.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.79.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.79.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.79.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.79.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.79.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.8.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.8.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.8.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.8.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.8.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.8.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.80.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.80.down_proj.weight_scale": "model-00014-of-00092.safetensors", 
+ "model.layers.13.mlp.experts.80.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.80.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.80.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.80.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.81.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.81.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.81.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.81.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.81.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.81.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.82.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.82.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.82.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.82.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.82.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.82.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.83.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.83.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.83.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.83.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.83.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.83.up_proj.weight_scale": 
"model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.84.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.84.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.84.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.84.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.84.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.84.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.85.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.85.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.85.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.85.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.85.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.85.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.86.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.86.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.86.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.86.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.86.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.86.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.87.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.87.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.87.gate_proj.weight": "model-00014-of-00092.safetensors", + 
"model.layers.13.mlp.experts.87.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.87.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.87.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.88.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.88.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.88.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.88.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.88.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.88.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.89.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.89.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.89.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.89.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.89.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.89.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.9.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.9.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.9.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.9.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.9.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.9.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.90.down_proj.weight": "model-00014-of-00092.safetensors", 
+ "model.layers.13.mlp.experts.90.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.90.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.90.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.90.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.90.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.91.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.91.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.91.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.91.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.91.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.91.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.92.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.92.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.92.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.92.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.92.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.92.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.93.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.93.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.93.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.93.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.93.up_proj.weight": 
"model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.93.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.94.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.94.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.94.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.94.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.94.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.94.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.95.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.95.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.95.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.95.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.95.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.95.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.96.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.96.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.96.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.96.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.96.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.96.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.97.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.97.down_proj.weight_scale": "model-00014-of-00092.safetensors", + 
"model.layers.13.mlp.experts.97.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.97.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.97.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.97.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.98.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.98.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.98.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.98.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.98.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.98.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.99.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.99.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.99.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.99.gate_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.99.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.experts.99.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.gate.e_score_correction_bias": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.gate.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.shared_experts.down_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.shared_experts.down_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.shared_experts.gate_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.shared_experts.gate_proj.weight_scale": 
"model-00014-of-00092.safetensors", + "model.layers.13.mlp.shared_experts.up_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.mlp.shared_experts.up_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.post_attention_layernorm.weight": "model-00014-of-00092.safetensors", + "model.layers.13.self_attn.k_norm.weight": "model-00014-of-00092.safetensors", + "model.layers.13.self_attn.k_proj.bias": "model-00014-of-00092.safetensors", + "model.layers.13.self_attn.k_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.self_attn.k_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.self_attn.o_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.self_attn.o_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.self_attn.q_norm.weight": "model-00014-of-00092.safetensors", + "model.layers.13.self_attn.q_proj.bias": "model-00014-of-00092.safetensors", + "model.layers.13.self_attn.q_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.self_attn.q_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.13.self_attn.v_proj.bias": "model-00014-of-00092.safetensors", + "model.layers.13.self_attn.v_proj.weight": "model-00014-of-00092.safetensors", + "model.layers.13.self_attn.v_proj.weight_scale": "model-00014-of-00092.safetensors", + "model.layers.14.input_layernorm.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.0.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.0.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.0.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.0.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.0.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.0.up_proj.weight_scale": 
"model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.1.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.1.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.1.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.1.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.1.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.1.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.10.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.10.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.10.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.10.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.10.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.10.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.100.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.100.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.100.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.100.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.100.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.100.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.101.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.101.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.101.gate_proj.weight": "model-00015-of-00092.safetensors", + 
"model.layers.14.mlp.experts.101.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.101.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.101.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.102.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.102.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.102.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.102.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.102.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.102.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.103.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.103.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.103.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.103.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.103.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.103.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.104.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.104.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.104.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.104.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.104.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.104.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.105.down_proj.weight": 
"model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.105.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.105.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.105.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.105.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.105.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.106.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.106.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.106.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.106.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.106.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.106.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.107.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.107.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.107.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.107.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.107.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.107.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.108.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.108.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.108.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.108.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + 
"model.layers.14.mlp.experts.108.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.108.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.109.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.109.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.109.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.109.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.109.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.109.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.11.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.11.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.11.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.11.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.11.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.11.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.110.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.110.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.110.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.110.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.110.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.110.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.111.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.111.down_proj.weight_scale": 
"model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.111.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.111.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.111.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.111.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.112.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.112.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.112.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.112.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.112.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.112.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.113.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.113.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.113.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.113.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.113.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.113.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.114.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.114.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.114.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.114.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.114.up_proj.weight": "model-00015-of-00092.safetensors", + 
"model.layers.14.mlp.experts.114.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.115.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.115.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.115.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.115.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.115.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.115.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.116.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.116.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.116.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.116.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.116.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.116.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.117.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.117.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.117.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.117.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.117.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.117.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.118.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.118.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.118.gate_proj.weight": 
"model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.118.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.118.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.118.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.119.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.119.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.119.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.119.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.119.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.119.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.12.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.12.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.12.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.12.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.12.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.12.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.120.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.120.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.120.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.120.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.120.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.120.up_proj.weight_scale": "model-00015-of-00092.safetensors", + 
"model.layers.14.mlp.experts.121.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.121.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.121.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.121.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.121.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.121.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.122.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.122.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.122.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.122.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.122.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.122.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.123.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.123.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.123.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.123.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.123.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.123.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.124.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.124.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.124.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.124.gate_proj.weight_scale": 
"model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.124.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.124.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.125.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.125.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.125.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.125.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.125.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.125.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.126.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.126.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.126.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.126.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.126.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.126.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.127.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.127.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.127.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.127.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.127.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.127.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.128.down_proj.weight": "model-00015-of-00092.safetensors", + 
"model.layers.14.mlp.experts.128.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.128.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.128.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.128.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.128.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.129.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.129.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.129.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.129.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.129.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.129.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.13.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.13.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.13.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.13.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.13.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.13.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.130.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.130.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.130.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.130.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.130.up_proj.weight": 
"model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.130.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.131.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.131.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.131.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.131.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.131.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.131.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.132.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.132.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.132.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.132.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.132.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.132.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.133.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.133.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.133.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.133.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.133.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.133.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.134.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.134.down_proj.weight_scale": "model-00015-of-00092.safetensors", + 
"model.layers.14.mlp.experts.134.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.134.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.134.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.134.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.135.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.135.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.135.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.135.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.135.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.135.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.136.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.136.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.136.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.136.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.136.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.136.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.137.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.137.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.137.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.137.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.137.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.137.up_proj.weight_scale": 
"model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.138.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.138.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.138.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.138.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.138.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.138.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.139.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.139.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.139.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.139.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.139.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.139.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.14.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.14.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.14.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.14.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.14.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.14.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.140.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.140.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.140.gate_proj.weight": "model-00015-of-00092.safetensors", + 
"model.layers.14.mlp.experts.140.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.140.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.140.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.141.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.141.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.141.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.141.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.141.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.141.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.142.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.142.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.142.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.142.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.142.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.142.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.143.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.143.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.143.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.143.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.143.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.143.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.144.down_proj.weight": 
"model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.144.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.144.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.144.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.144.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.144.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.145.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.145.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.145.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.145.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.145.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.145.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.146.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.146.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.146.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.146.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.146.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.146.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.147.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.147.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.147.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.147.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + 
"model.layers.14.mlp.experts.147.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.147.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.148.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.148.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.148.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.148.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.148.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.148.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.149.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.149.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.149.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.149.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.149.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.149.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.15.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.15.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.15.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.15.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.15.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.15.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.150.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.150.down_proj.weight_scale": 
"model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.150.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.150.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.150.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.150.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.151.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.151.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.151.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.151.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.151.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.151.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.152.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.152.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.152.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.152.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.152.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.152.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.153.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.153.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.153.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.153.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.153.up_proj.weight": "model-00015-of-00092.safetensors", + 
"model.layers.14.mlp.experts.153.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.154.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.154.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.154.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.154.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.154.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.154.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.155.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.155.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.155.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.155.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.155.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.155.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.156.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.156.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.156.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.156.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.156.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.156.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.157.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.157.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.157.gate_proj.weight": 
"model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.157.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.157.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.157.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.158.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.158.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.158.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.158.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.158.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.158.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.159.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.159.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.159.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.159.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.159.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.159.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.16.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.16.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.16.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.16.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.16.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.16.up_proj.weight_scale": "model-00015-of-00092.safetensors", + 
"model.layers.14.mlp.experts.17.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.17.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.17.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.17.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.17.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.17.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.18.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.18.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.18.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.18.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.18.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.18.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.19.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.19.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.19.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.19.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.19.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.19.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.2.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.2.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.2.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.2.gate_proj.weight_scale": 
"model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.2.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.2.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.20.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.20.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.20.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.20.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.20.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.20.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.21.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.21.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.21.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.21.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.21.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.21.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.22.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.22.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.22.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.22.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.22.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.22.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.23.down_proj.weight": "model-00015-of-00092.safetensors", + 
"model.layers.14.mlp.experts.23.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.23.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.23.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.23.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.23.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.24.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.24.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.24.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.24.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.24.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.24.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.25.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.25.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.25.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.25.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.25.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.25.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.26.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.26.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.26.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.26.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.26.up_proj.weight": 
"model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.26.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.27.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.27.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.27.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.27.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.27.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.27.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.28.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.28.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.28.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.28.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.28.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.28.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.29.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.29.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.29.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.29.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.29.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.29.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.3.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.3.down_proj.weight_scale": "model-00015-of-00092.safetensors", + 
"model.layers.14.mlp.experts.3.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.3.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.3.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.3.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.30.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.30.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.30.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.30.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.30.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.30.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.31.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.31.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.31.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.31.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.31.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.31.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.32.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.32.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.32.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.32.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.32.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.32.up_proj.weight_scale": 
"model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.33.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.33.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.33.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.33.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.33.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.33.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.34.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.34.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.34.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.34.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.34.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.34.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.35.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.35.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.35.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.35.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.35.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.35.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.36.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.36.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.36.gate_proj.weight": "model-00015-of-00092.safetensors", + 
"model.layers.14.mlp.experts.36.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.36.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.36.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.37.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.37.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.37.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.37.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.37.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.37.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.38.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.38.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.38.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.38.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.38.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.38.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.39.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.39.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.39.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.39.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.39.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.39.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.4.down_proj.weight": 
"model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.4.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.4.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.4.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.4.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.4.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.40.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.40.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.40.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.40.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.40.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.40.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.41.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.41.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.41.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.41.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.41.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.41.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.42.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.42.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.42.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.42.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + 
"model.layers.14.mlp.experts.42.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.42.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.43.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.43.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.43.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.43.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.43.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.43.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.44.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.44.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.44.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.44.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.44.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.44.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.45.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.45.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.45.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.45.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.45.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.45.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.46.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.46.down_proj.weight_scale": 
"model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.46.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.46.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.46.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.46.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.47.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.47.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.47.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.47.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.47.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.47.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.48.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.48.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.48.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.48.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.48.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.48.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.49.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.49.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.49.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.49.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.49.up_proj.weight": "model-00015-of-00092.safetensors", + 
"model.layers.14.mlp.experts.49.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.5.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.5.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.5.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.5.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.5.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.5.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.50.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.50.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.50.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.50.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.50.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.50.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.51.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.51.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.51.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.51.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.51.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.51.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.52.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.52.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.52.gate_proj.weight": 
"model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.52.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.52.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.52.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.53.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.53.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.53.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.53.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.53.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.53.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.54.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.54.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.54.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.54.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.54.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.54.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.55.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.55.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.55.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.55.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.55.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.55.up_proj.weight_scale": "model-00015-of-00092.safetensors", + 
"model.layers.14.mlp.experts.56.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.56.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.56.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.56.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.56.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.56.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.57.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.57.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.57.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.57.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.57.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.57.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.58.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.58.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.58.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.58.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.58.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.58.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.59.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.59.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.59.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.59.gate_proj.weight_scale": 
"model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.59.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.59.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.6.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.6.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.6.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.6.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.6.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.6.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.60.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.60.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.60.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.60.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.60.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.60.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.61.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.61.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.61.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.61.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.61.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.61.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.62.down_proj.weight": "model-00015-of-00092.safetensors", + 
"model.layers.14.mlp.experts.62.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.62.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.62.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.62.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.62.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.63.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.63.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.63.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.63.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.63.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.63.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.64.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.64.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.64.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.64.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.64.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.64.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.65.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.65.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.65.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.65.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.65.up_proj.weight": 
"model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.65.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.66.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.66.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.66.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.66.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.66.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.66.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.67.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.67.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.67.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.67.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.67.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.67.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.68.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.68.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.68.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.68.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.68.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.68.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.69.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.69.down_proj.weight_scale": "model-00015-of-00092.safetensors", + 
"model.layers.14.mlp.experts.69.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.69.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.69.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.69.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.7.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.7.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.7.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.7.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.7.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.7.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.70.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.70.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.70.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.70.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.70.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.70.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.71.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.71.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.71.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.71.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.71.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.71.up_proj.weight_scale": "model-00015-of-00092.safetensors", 
+ "model.layers.14.mlp.experts.72.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.72.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.72.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.72.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.72.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.72.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.73.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.73.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.73.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.73.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.73.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.73.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.74.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.74.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.74.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.74.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.74.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.74.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.75.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.75.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.75.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.75.gate_proj.weight_scale": 
"model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.75.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.75.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.76.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.76.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.76.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.76.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.76.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.76.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.77.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.77.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.77.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.77.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.77.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.77.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.78.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.78.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.78.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.78.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.78.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.78.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.79.down_proj.weight": "model-00015-of-00092.safetensors", + 
"model.layers.14.mlp.experts.79.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.79.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.79.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.79.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.79.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.8.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.8.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.8.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.8.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.8.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.8.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.80.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.80.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.80.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.80.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.80.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.80.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.81.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.81.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.81.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.81.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.81.up_proj.weight": 
"model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.81.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.82.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.82.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.82.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.82.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.82.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.82.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.83.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.83.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.83.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.83.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.83.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.83.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.84.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.84.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.84.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.84.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.84.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.84.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.85.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.85.down_proj.weight_scale": "model-00015-of-00092.safetensors", + 
"model.layers.14.mlp.experts.85.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.85.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.85.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.85.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.86.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.86.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.86.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.86.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.86.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.86.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.87.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.87.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.87.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.87.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.87.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.87.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.88.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.88.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.88.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.88.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.88.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.88.up_proj.weight_scale": 
"model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.89.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.89.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.89.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.89.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.89.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.89.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.9.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.9.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.9.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.9.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.9.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.9.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.90.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.90.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.90.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.90.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.90.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.90.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.91.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.91.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.91.gate_proj.weight": "model-00015-of-00092.safetensors", + 
"model.layers.14.mlp.experts.91.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.91.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.91.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.92.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.92.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.92.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.92.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.92.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.92.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.93.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.93.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.93.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.93.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.93.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.93.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.94.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.94.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.94.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.94.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.94.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.94.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.95.down_proj.weight": 
"model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.95.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.95.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.95.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.95.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.95.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.96.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.96.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.96.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.96.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.96.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.96.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.97.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.97.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.97.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.97.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.97.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.97.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.98.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.98.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.98.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.98.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + 
"model.layers.14.mlp.experts.98.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.98.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.99.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.99.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.99.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.99.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.99.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.experts.99.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.gate.e_score_correction_bias": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.gate.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.shared_experts.down_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.shared_experts.down_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.shared_experts.gate_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.shared_experts.gate_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.shared_experts.up_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.mlp.shared_experts.up_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.post_attention_layernorm.weight": "model-00015-of-00092.safetensors", + "model.layers.14.self_attn.k_norm.weight": "model-00015-of-00092.safetensors", + "model.layers.14.self_attn.k_proj.bias": "model-00015-of-00092.safetensors", + "model.layers.14.self_attn.k_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.self_attn.k_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.self_attn.o_proj.weight": "model-00015-of-00092.safetensors", + 
"model.layers.14.self_attn.o_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.self_attn.q_norm.weight": "model-00015-of-00092.safetensors", + "model.layers.14.self_attn.q_proj.bias": "model-00015-of-00092.safetensors", + "model.layers.14.self_attn.q_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.self_attn.q_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.14.self_attn.v_proj.bias": "model-00015-of-00092.safetensors", + "model.layers.14.self_attn.v_proj.weight": "model-00015-of-00092.safetensors", + "model.layers.14.self_attn.v_proj.weight_scale": "model-00015-of-00092.safetensors", + "model.layers.15.input_layernorm.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.0.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.0.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.0.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.0.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.0.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.0.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.1.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.1.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.1.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.1.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.1.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.1.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.10.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.10.down_proj.weight_scale": 
"model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.10.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.10.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.10.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.10.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.100.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.100.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.100.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.100.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.100.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.100.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.101.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.101.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.101.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.101.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.101.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.101.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.102.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.102.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.102.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.102.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.102.up_proj.weight": "model-00016-of-00092.safetensors", + 
"model.layers.15.mlp.experts.102.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.103.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.103.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.103.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.103.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.103.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.103.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.104.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.104.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.104.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.104.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.104.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.104.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.105.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.105.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.105.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.105.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.105.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.105.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.106.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.106.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.106.gate_proj.weight": 
"model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.106.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.106.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.106.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.107.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.107.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.107.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.107.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.107.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.107.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.108.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.108.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.108.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.108.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.108.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.108.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.109.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.109.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.109.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.109.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.109.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.109.up_proj.weight_scale": "model-00016-of-00092.safetensors", + 
"model.layers.15.mlp.experts.11.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.11.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.11.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.11.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.11.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.11.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.110.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.110.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.110.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.110.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.110.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.110.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.111.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.111.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.111.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.111.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.111.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.111.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.112.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.112.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.112.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.112.gate_proj.weight_scale": 
"model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.112.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.112.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.113.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.113.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.113.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.113.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.113.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.113.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.114.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.114.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.114.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.114.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.114.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.114.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.115.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.115.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.115.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.115.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.115.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.115.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.116.down_proj.weight": "model-00016-of-00092.safetensors", + 
"model.layers.15.mlp.experts.116.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.116.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.116.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.116.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.116.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.117.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.117.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.117.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.117.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.117.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.117.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.118.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.118.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.118.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.118.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.118.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.118.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.119.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.119.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.119.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.119.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.119.up_proj.weight": 
"model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.119.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.12.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.12.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.12.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.12.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.12.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.12.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.120.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.120.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.120.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.120.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.120.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.120.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.121.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.121.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.121.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.121.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.121.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.121.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.122.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.122.down_proj.weight_scale": "model-00016-of-00092.safetensors", + 
"model.layers.15.mlp.experts.122.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.122.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.122.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.122.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.123.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.123.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.123.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.123.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.123.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.123.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.124.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.124.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.124.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.124.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.124.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.124.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.125.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.125.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.125.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.125.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.125.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.125.up_proj.weight_scale": 
"model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.126.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.126.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.126.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.126.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.126.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.126.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.127.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.127.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.127.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.127.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.127.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.127.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.128.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.128.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.128.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.128.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.128.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.128.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.129.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.129.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.129.gate_proj.weight": "model-00016-of-00092.safetensors", + 
"model.layers.15.mlp.experts.129.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.129.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.129.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.13.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.13.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.13.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.13.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.13.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.13.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.130.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.130.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.130.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.130.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.130.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.130.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.131.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.131.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.131.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.131.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.131.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.131.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.132.down_proj.weight": 
"model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.132.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.132.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.132.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.132.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.132.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.133.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.133.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.133.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.133.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.133.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.133.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.134.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.134.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.134.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.134.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.134.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.134.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.135.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.135.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.135.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.135.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + 
"model.layers.15.mlp.experts.135.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.135.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.136.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.136.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.136.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.136.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.136.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.136.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.137.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.137.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.137.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.137.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.137.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.137.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.138.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.138.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.138.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.138.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.138.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.138.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.139.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.139.down_proj.weight_scale": 
"model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.139.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.139.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.139.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.139.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.14.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.14.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.14.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.14.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.14.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.14.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.140.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.140.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.140.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.140.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.140.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.140.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.141.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.141.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.141.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.141.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.141.up_proj.weight": "model-00016-of-00092.safetensors", + 
"model.layers.15.mlp.experts.141.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.142.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.142.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.142.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.142.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.142.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.142.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.143.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.143.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.143.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.143.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.143.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.143.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.144.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.144.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.144.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.144.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.144.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.144.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.145.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.145.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.145.gate_proj.weight": 
"model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.145.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.145.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.145.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.146.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.146.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.146.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.146.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.146.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.146.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.147.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.147.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.147.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.147.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.147.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.147.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.148.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.148.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.148.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.148.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.148.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.148.up_proj.weight_scale": "model-00016-of-00092.safetensors", + 
"model.layers.15.mlp.experts.149.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.149.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.149.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.149.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.149.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.149.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.15.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.15.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.15.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.15.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.15.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.15.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.150.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.150.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.150.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.150.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.150.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.150.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.151.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.151.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.151.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.151.gate_proj.weight_scale": 
"model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.151.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.151.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.152.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.152.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.152.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.152.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.152.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.152.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.153.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.153.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.153.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.153.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.153.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.153.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.154.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.154.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.154.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.154.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.154.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.154.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.155.down_proj.weight": "model-00016-of-00092.safetensors", + 
"model.layers.15.mlp.experts.155.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.155.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.155.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.155.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.155.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.156.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.156.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.156.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.156.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.156.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.156.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.157.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.157.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.157.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.157.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.157.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.157.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.158.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.158.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.158.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.158.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.158.up_proj.weight": 
"model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.158.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.159.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.159.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.159.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.159.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.159.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.159.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.16.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.16.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.16.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.16.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.16.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.16.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.17.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.17.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.17.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.17.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.17.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.17.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.18.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.18.down_proj.weight_scale": "model-00016-of-00092.safetensors", + 
"model.layers.15.mlp.experts.18.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.18.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.18.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.18.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.19.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.19.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.19.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.19.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.19.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.19.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.2.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.2.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.2.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.2.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.2.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.2.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.20.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.20.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.20.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.20.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.20.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.20.up_proj.weight_scale": "model-00016-of-00092.safetensors", 
+ "model.layers.15.mlp.experts.21.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.21.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.21.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.21.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.21.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.21.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.22.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.22.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.22.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.22.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.22.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.22.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.23.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.23.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.23.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.23.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.23.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.23.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.24.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.24.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.24.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.24.gate_proj.weight_scale": 
"model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.24.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.24.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.25.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.25.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.25.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.25.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.25.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.25.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.26.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.26.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.26.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.26.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.26.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.26.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.27.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.27.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.27.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.27.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.27.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.27.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.28.down_proj.weight": "model-00016-of-00092.safetensors", + 
"model.layers.15.mlp.experts.28.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.28.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.28.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.28.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.28.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.29.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.29.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.29.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.29.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.29.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.29.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.3.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.3.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.3.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.3.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.3.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.3.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.30.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.30.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.30.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.30.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.30.up_proj.weight": 
"model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.30.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.31.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.31.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.31.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.31.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.31.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.31.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.32.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.32.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.32.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.32.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.32.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.32.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.33.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.33.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.33.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.33.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.33.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.33.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.34.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.34.down_proj.weight_scale": "model-00016-of-00092.safetensors", + 
"model.layers.15.mlp.experts.34.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.34.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.34.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.34.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.35.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.35.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.35.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.35.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.35.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.35.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.36.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.36.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.36.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.36.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.36.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.36.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.37.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.37.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.37.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.37.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.37.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.37.up_proj.weight_scale": 
"model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.38.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.38.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.38.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.38.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.38.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.38.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.39.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.39.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.39.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.39.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.39.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.39.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.4.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.4.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.4.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.4.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.4.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.4.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.40.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.40.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.40.gate_proj.weight": "model-00016-of-00092.safetensors", + 
"model.layers.15.mlp.experts.40.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.40.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.40.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.41.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.41.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.41.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.41.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.41.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.41.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.42.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.42.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.42.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.42.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.42.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.42.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.43.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.43.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.43.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.43.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.43.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.43.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.44.down_proj.weight": 
"model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.44.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.44.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.44.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.44.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.44.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.45.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.45.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.45.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.45.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.45.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.45.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.46.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.46.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.46.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.46.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.46.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.46.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.47.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.47.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.47.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.47.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + 
"model.layers.15.mlp.experts.47.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.47.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.48.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.48.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.48.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.48.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.48.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.48.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.49.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.49.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.49.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.49.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.49.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.49.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.5.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.5.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.5.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.5.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.5.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.5.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.50.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.50.down_proj.weight_scale": "model-00016-of-00092.safetensors", 
+ "model.layers.15.mlp.experts.50.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.50.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.50.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.50.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.51.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.51.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.51.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.51.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.51.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.51.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.52.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.52.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.52.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.52.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.52.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.52.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.53.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.53.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.53.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.53.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.53.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.53.up_proj.weight_scale": 
"model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.54.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.54.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.54.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.54.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.54.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.54.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.55.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.55.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.55.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.55.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.55.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.55.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.56.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.56.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.56.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.56.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.56.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.56.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.57.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.57.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.57.gate_proj.weight": "model-00016-of-00092.safetensors", + 
"model.layers.15.mlp.experts.57.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.57.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.57.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.58.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.58.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.58.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.58.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.58.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.58.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.59.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.59.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.59.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.59.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.59.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.59.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.6.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.6.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.6.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.6.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.6.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.6.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.60.down_proj.weight": "model-00016-of-00092.safetensors", 
+ "model.layers.15.mlp.experts.60.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.60.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.60.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.60.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.60.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.61.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.61.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.61.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.61.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.61.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.61.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.62.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.62.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.62.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.62.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.62.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.62.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.63.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.63.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.63.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.63.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.63.up_proj.weight": 
"model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.63.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.64.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.64.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.64.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.64.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.64.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.64.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.65.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.65.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.65.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.65.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.65.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.65.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.66.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.66.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.66.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.66.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.66.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.66.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.67.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.67.down_proj.weight_scale": "model-00016-of-00092.safetensors", + 
"model.layers.15.mlp.experts.67.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.67.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.67.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.67.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.68.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.68.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.68.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.68.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.68.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.68.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.69.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.69.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.69.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.69.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.69.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.69.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.7.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.7.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.7.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.7.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.7.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.7.up_proj.weight_scale": "model-00016-of-00092.safetensors", 
+ "model.layers.15.mlp.experts.70.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.70.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.70.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.70.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.70.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.70.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.71.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.71.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.71.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.71.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.71.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.71.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.72.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.72.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.72.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.72.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.72.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.72.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.73.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.73.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.73.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.73.gate_proj.weight_scale": 
"model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.73.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.73.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.74.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.74.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.74.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.74.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.74.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.74.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.75.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.75.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.75.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.75.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.75.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.75.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.76.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.76.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.76.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.76.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.76.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.76.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.77.down_proj.weight": "model-00016-of-00092.safetensors", + 
"model.layers.15.mlp.experts.77.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.77.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.77.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.77.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.77.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.78.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.78.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.78.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.78.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.78.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.78.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.79.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.79.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.79.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.79.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.79.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.79.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.8.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.8.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.8.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.8.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.8.up_proj.weight": 
"model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.8.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.80.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.80.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.80.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.80.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.80.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.80.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.81.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.81.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.81.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.81.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.81.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.81.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.82.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.82.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.82.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.82.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.82.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.82.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.83.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.83.down_proj.weight_scale": "model-00016-of-00092.safetensors", + 
"model.layers.15.mlp.experts.83.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.83.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.83.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.83.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.84.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.84.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.84.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.84.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.84.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.84.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.85.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.85.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.85.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.85.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.85.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.85.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.86.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.86.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.86.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.86.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.86.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.86.up_proj.weight_scale": 
"model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.87.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.87.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.87.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.87.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.87.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.87.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.88.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.88.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.88.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.88.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.88.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.88.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.89.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.89.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.89.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.89.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.89.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.89.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.9.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.9.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.9.gate_proj.weight": "model-00016-of-00092.safetensors", + 
"model.layers.15.mlp.experts.9.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.9.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.9.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.90.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.90.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.90.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.90.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.90.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.90.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.91.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.91.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.91.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.91.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.91.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.91.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.92.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.92.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.92.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.92.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.92.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.92.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.93.down_proj.weight": 
"model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.93.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.93.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.93.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.93.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.93.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.94.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.94.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.94.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.94.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.94.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.94.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.95.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.95.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.95.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.95.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.95.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.95.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.96.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.96.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.96.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.96.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + 
"model.layers.15.mlp.experts.96.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.96.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.97.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.97.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.97.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.97.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.97.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.97.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.98.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.98.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.98.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.98.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.98.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.98.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.99.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.99.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.99.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.99.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.99.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.experts.99.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.gate.e_score_correction_bias": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.gate.weight": "model-00016-of-00092.safetensors", + 
"model.layers.15.mlp.shared_experts.down_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.shared_experts.down_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.shared_experts.gate_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.shared_experts.gate_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.shared_experts.up_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.mlp.shared_experts.up_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.post_attention_layernorm.weight": "model-00016-of-00092.safetensors", + "model.layers.15.self_attn.k_norm.weight": "model-00016-of-00092.safetensors", + "model.layers.15.self_attn.k_proj.bias": "model-00016-of-00092.safetensors", + "model.layers.15.self_attn.k_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.self_attn.k_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.self_attn.o_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.self_attn.o_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.self_attn.q_norm.weight": "model-00016-of-00092.safetensors", + "model.layers.15.self_attn.q_proj.bias": "model-00016-of-00092.safetensors", + "model.layers.15.self_attn.q_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.self_attn.q_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.15.self_attn.v_proj.bias": "model-00016-of-00092.safetensors", + "model.layers.15.self_attn.v_proj.weight": "model-00016-of-00092.safetensors", + "model.layers.15.self_attn.v_proj.weight_scale": "model-00016-of-00092.safetensors", + "model.layers.16.input_layernorm.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.0.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.0.down_proj.weight_scale": "model-00017-of-00092.safetensors", + 
"model.layers.16.mlp.experts.0.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.0.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.0.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.0.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.1.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.1.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.1.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.1.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.1.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.1.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.10.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.10.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.10.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.10.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.10.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.10.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.100.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.100.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.100.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.100.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.100.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.100.up_proj.weight_scale": 
"model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.101.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.101.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.101.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.101.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.101.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.101.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.102.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.102.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.102.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.102.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.102.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.102.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.103.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.103.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.103.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.103.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.103.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.103.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.104.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.104.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.104.gate_proj.weight": "model-00017-of-00092.safetensors", + 
"model.layers.16.mlp.experts.104.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.104.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.104.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.105.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.105.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.105.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.105.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.105.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.105.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.106.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.106.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.106.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.106.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.106.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.106.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.107.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.107.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.107.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.107.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.107.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.107.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.108.down_proj.weight": 
"model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.108.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.108.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.108.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.108.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.108.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.109.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.109.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.109.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.109.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.109.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.109.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.11.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.11.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.11.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.11.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.11.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.11.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.110.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.110.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.110.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.110.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + 
"model.layers.16.mlp.experts.110.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.110.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.111.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.111.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.111.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.111.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.111.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.111.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.112.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.112.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.112.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.112.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.112.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.112.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.113.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.113.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.113.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.113.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.113.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.113.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.114.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.114.down_proj.weight_scale": 
"model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.114.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.114.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.114.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.114.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.115.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.115.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.115.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.115.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.115.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.115.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.116.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.116.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.116.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.116.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.116.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.116.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.117.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.117.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.117.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.117.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.117.up_proj.weight": "model-00017-of-00092.safetensors", + 
"model.layers.16.mlp.experts.117.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.118.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.118.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.118.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.118.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.118.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.118.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.119.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.119.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.119.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.119.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.119.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.119.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.12.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.12.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.12.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.12.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.12.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.12.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.120.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.120.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.120.gate_proj.weight": 
"model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.120.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.120.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.120.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.121.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.121.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.121.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.121.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.121.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.121.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.122.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.122.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.122.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.122.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.122.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.122.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.123.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.123.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.123.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.123.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.123.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.123.up_proj.weight_scale": "model-00017-of-00092.safetensors", + 
"model.layers.16.mlp.experts.124.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.124.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.124.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.124.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.124.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.124.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.125.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.125.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.125.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.125.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.125.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.125.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.126.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.126.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.126.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.126.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.126.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.126.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.127.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.127.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.127.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.127.gate_proj.weight_scale": 
"model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.127.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.127.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.128.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.128.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.128.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.128.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.128.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.128.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.129.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.129.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.129.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.129.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.129.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.129.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.13.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.13.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.13.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.13.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.13.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.13.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.130.down_proj.weight": "model-00017-of-00092.safetensors", + 
"model.layers.16.mlp.experts.130.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.130.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.130.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.130.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.130.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.131.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.131.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.131.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.131.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.131.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.131.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.132.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.132.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.132.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.132.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.132.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.132.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.133.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.133.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.133.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.133.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.133.up_proj.weight": 
"model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.133.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.134.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.134.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.134.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.134.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.134.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.134.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.135.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.135.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.135.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.135.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.135.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.135.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.136.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.136.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.136.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.136.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.136.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.136.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.137.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.137.down_proj.weight_scale": "model-00017-of-00092.safetensors", + 
"model.layers.16.mlp.experts.137.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.137.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.137.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.137.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.138.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.138.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.138.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.138.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.138.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.138.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.139.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.139.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.139.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.139.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.139.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.139.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.14.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.14.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.14.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.14.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.14.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.14.up_proj.weight_scale": 
"model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.140.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.140.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.140.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.140.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.140.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.140.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.141.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.141.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.141.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.141.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.141.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.141.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.142.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.142.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.142.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.142.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.142.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.142.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.143.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.143.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.143.gate_proj.weight": "model-00017-of-00092.safetensors", + 
"model.layers.16.mlp.experts.143.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.143.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.143.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.144.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.144.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.144.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.144.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.144.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.144.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.145.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.145.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.145.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.145.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.145.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.145.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.146.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.146.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.146.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.146.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.146.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.146.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.147.down_proj.weight": 
"model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.147.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.147.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.147.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.147.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.147.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.148.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.148.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.148.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.148.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.148.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.148.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.149.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.149.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.149.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.149.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.149.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.149.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.15.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.15.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.15.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.15.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + 
"model.layers.16.mlp.experts.15.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.15.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.150.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.150.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.150.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.150.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.150.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.150.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.151.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.151.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.151.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.151.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.151.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.151.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.152.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.152.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.152.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.152.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.152.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.152.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.153.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.153.down_proj.weight_scale": 
"model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.153.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.153.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.153.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.153.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.154.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.154.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.154.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.154.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.154.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.154.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.155.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.155.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.155.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.155.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.155.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.155.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.156.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.156.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.156.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.156.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.156.up_proj.weight": "model-00017-of-00092.safetensors", + 
"model.layers.16.mlp.experts.156.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.157.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.157.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.157.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.157.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.157.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.157.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.158.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.158.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.158.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.158.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.158.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.158.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.159.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.159.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.159.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.159.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.159.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.159.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.16.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.16.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.16.gate_proj.weight": 
"model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.16.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.16.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.16.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.17.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.17.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.17.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.17.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.17.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.17.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.18.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.18.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.18.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.18.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.18.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.18.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.19.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.19.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.19.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.19.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.19.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.19.up_proj.weight_scale": "model-00017-of-00092.safetensors", + 
"model.layers.16.mlp.experts.2.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.2.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.2.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.2.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.2.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.2.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.20.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.20.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.20.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.20.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.20.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.20.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.21.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.21.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.21.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.21.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.21.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.21.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.22.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.22.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.22.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.22.gate_proj.weight_scale": 
"model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.22.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.22.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.23.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.23.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.23.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.23.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.23.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.23.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.24.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.24.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.24.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.24.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.24.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.24.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.25.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.25.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.25.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.25.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.25.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.25.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.26.down_proj.weight": "model-00017-of-00092.safetensors", + 
"model.layers.16.mlp.experts.26.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.26.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.26.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.26.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.26.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.27.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.27.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.27.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.27.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.27.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.27.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.28.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.28.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.28.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.28.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.28.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.28.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.29.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.29.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.29.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.29.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.29.up_proj.weight": 
"model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.29.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.3.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.3.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.3.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.3.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.3.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.3.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.30.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.30.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.30.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.30.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.30.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.30.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.31.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.31.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.31.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.31.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.31.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.31.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.32.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.32.down_proj.weight_scale": "model-00017-of-00092.safetensors", + 
"model.layers.16.mlp.experts.32.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.32.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.32.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.32.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.33.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.33.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.33.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.33.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.33.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.33.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.34.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.34.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.34.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.34.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.34.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.34.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.35.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.35.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.35.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.35.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.35.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.35.up_proj.weight_scale": 
"model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.36.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.36.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.36.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.36.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.36.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.36.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.37.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.37.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.37.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.37.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.37.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.37.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.38.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.38.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.38.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.38.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.38.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.38.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.39.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.39.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.39.gate_proj.weight": "model-00017-of-00092.safetensors", + 
"model.layers.16.mlp.experts.39.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.39.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.39.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.4.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.4.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.4.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.4.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.4.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.4.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.40.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.40.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.40.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.40.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.40.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.40.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.41.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.41.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.41.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.41.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.41.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.41.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.42.down_proj.weight": "model-00017-of-00092.safetensors", 
+ "model.layers.16.mlp.experts.42.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.42.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.42.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.42.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.42.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.43.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.43.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.43.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.43.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.43.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.43.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.44.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.44.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.44.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.44.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.44.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.44.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.45.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.45.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.45.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.45.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.45.up_proj.weight": 
"model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.45.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.46.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.46.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.46.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.46.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.46.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.46.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.47.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.47.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.47.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.47.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.47.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.47.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.48.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.48.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.48.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.48.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.48.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.48.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.49.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.49.down_proj.weight_scale": "model-00017-of-00092.safetensors", + 
"model.layers.16.mlp.experts.49.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.49.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.49.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.49.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.5.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.5.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.5.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.5.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.5.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.5.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.50.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.50.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.50.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.50.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.50.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.50.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.51.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.51.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.51.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.51.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.51.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.51.up_proj.weight_scale": "model-00017-of-00092.safetensors", 
+ "model.layers.16.mlp.experts.52.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.52.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.52.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.52.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.52.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.52.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.53.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.53.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.53.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.53.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.53.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.53.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.54.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.54.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.54.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.54.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.54.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.54.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.55.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.55.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.55.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.55.gate_proj.weight_scale": 
"model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.55.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.55.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.56.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.56.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.56.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.56.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.56.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.56.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.57.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.57.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.57.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.57.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.57.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.57.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.58.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.58.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.58.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.58.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.58.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.58.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.59.down_proj.weight": "model-00017-of-00092.safetensors", + 
"model.layers.16.mlp.experts.59.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.59.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.59.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.59.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.59.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.6.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.6.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.6.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.6.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.6.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.6.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.60.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.60.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.60.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.60.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.60.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.60.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.61.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.61.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.61.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.61.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.61.up_proj.weight": 
"model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.61.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.62.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.62.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.62.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.62.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.62.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.62.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.63.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.63.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.63.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.63.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.63.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.63.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.64.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.64.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.64.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.64.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.64.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.64.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.65.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.65.down_proj.weight_scale": "model-00017-of-00092.safetensors", + 
"model.layers.16.mlp.experts.65.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.65.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.65.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.65.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.66.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.66.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.66.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.66.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.66.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.66.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.67.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.67.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.67.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.67.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.67.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.67.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.68.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.68.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.68.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.68.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.68.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.68.up_proj.weight_scale": 
"model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.69.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.69.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.69.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.69.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.69.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.69.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.7.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.7.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.7.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.7.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.7.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.7.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.70.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.70.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.70.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.70.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.70.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.70.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.71.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.71.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.71.gate_proj.weight": "model-00017-of-00092.safetensors", + 
"model.layers.16.mlp.experts.71.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.71.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.71.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.72.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.72.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.72.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.72.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.72.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.72.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.73.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.73.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.73.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.73.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.73.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.73.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.74.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.74.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.74.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.74.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.74.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.74.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.75.down_proj.weight": 
"model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.75.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.75.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.75.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.75.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.75.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.76.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.76.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.76.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.76.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.76.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.76.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.77.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.77.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.77.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.77.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.77.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.77.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.78.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.78.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.78.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.78.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + 
"model.layers.16.mlp.experts.78.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.78.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.79.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.79.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.79.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.79.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.79.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.79.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.8.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.8.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.8.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.8.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.8.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.8.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.80.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.80.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.80.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.80.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.80.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.80.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.81.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.81.down_proj.weight_scale": "model-00017-of-00092.safetensors", 
+ "model.layers.16.mlp.experts.81.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.81.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.81.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.81.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.82.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.82.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.82.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.82.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.82.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.82.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.83.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.83.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.83.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.83.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.83.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.83.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.84.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.84.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.84.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.84.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.84.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.84.up_proj.weight_scale": 
"model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.85.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.85.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.85.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.85.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.85.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.85.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.86.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.86.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.86.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.86.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.86.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.86.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.87.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.87.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.87.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.87.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.87.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.87.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.88.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.88.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.88.gate_proj.weight": "model-00017-of-00092.safetensors", + 
"model.layers.16.mlp.experts.88.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.88.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.88.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.89.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.89.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.89.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.89.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.89.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.89.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.9.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.9.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.9.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.9.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.9.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.9.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.90.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.90.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.90.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.90.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.90.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.90.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.91.down_proj.weight": "model-00017-of-00092.safetensors", 
+ "model.layers.16.mlp.experts.91.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.91.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.91.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.91.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.91.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.92.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.92.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.92.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.92.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.92.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.92.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.93.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.93.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.93.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.93.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.93.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.93.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.94.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.94.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.94.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.94.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.94.up_proj.weight": 
"model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.94.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.95.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.95.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.95.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.95.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.95.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.95.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.96.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.96.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.96.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.96.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.96.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.96.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.97.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.97.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.97.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.97.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.97.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.97.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.98.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.98.down_proj.weight_scale": "model-00017-of-00092.safetensors", + 
"model.layers.16.mlp.experts.98.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.98.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.98.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.98.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.99.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.99.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.99.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.99.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.99.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.experts.99.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.gate.e_score_correction_bias": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.gate.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.shared_experts.down_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.shared_experts.down_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.shared_experts.gate_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.shared_experts.gate_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.shared_experts.up_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.mlp.shared_experts.up_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.post_attention_layernorm.weight": "model-00017-of-00092.safetensors", + "model.layers.16.self_attn.k_norm.weight": "model-00017-of-00092.safetensors", + "model.layers.16.self_attn.k_proj.bias": "model-00017-of-00092.safetensors", + "model.layers.16.self_attn.k_proj.weight": "model-00017-of-00092.safetensors", + 
"model.layers.16.self_attn.k_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.self_attn.o_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.self_attn.o_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.self_attn.q_norm.weight": "model-00017-of-00092.safetensors", + "model.layers.16.self_attn.q_proj.bias": "model-00017-of-00092.safetensors", + "model.layers.16.self_attn.q_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.self_attn.q_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.16.self_attn.v_proj.bias": "model-00017-of-00092.safetensors", + "model.layers.16.self_attn.v_proj.weight": "model-00017-of-00092.safetensors", + "model.layers.16.self_attn.v_proj.weight_scale": "model-00017-of-00092.safetensors", + "model.layers.17.input_layernorm.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.0.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.0.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.0.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.0.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.0.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.0.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.1.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.1.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.1.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.1.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.1.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.1.up_proj.weight_scale": "model-00018-of-00092.safetensors", + 
"model.layers.17.mlp.experts.10.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.10.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.10.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.10.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.10.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.10.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.100.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.100.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.100.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.100.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.100.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.100.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.101.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.101.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.101.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.101.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.101.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.101.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.102.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.102.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.102.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.102.gate_proj.weight_scale": 
"model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.102.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.102.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.103.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.103.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.103.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.103.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.103.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.103.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.104.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.104.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.104.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.104.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.104.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.104.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.105.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.105.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.105.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.105.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.105.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.105.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.106.down_proj.weight": "model-00018-of-00092.safetensors", + 
"model.layers.17.mlp.experts.106.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.106.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.106.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.106.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.106.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.107.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.107.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.107.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.107.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.107.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.107.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.108.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.108.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.108.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.108.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.108.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.108.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.109.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.109.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.109.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.109.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.109.up_proj.weight": 
"model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.109.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.11.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.11.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.11.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.11.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.11.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.11.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.110.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.110.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.110.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.110.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.110.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.110.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.111.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.111.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.111.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.111.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.111.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.111.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.112.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.112.down_proj.weight_scale": "model-00018-of-00092.safetensors", + 
"model.layers.17.mlp.experts.112.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.112.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.112.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.112.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.113.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.113.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.113.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.113.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.113.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.113.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.114.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.114.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.114.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.114.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.114.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.114.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.115.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.115.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.115.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.115.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.115.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.115.up_proj.weight_scale": 
"model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.116.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.116.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.116.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.116.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.116.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.116.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.117.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.117.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.117.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.117.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.117.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.117.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.118.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.118.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.118.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.118.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.118.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.118.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.119.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.119.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.119.gate_proj.weight": "model-00018-of-00092.safetensors", + 
"model.layers.17.mlp.experts.119.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.119.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.119.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.12.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.12.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.12.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.12.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.12.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.12.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.120.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.120.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.120.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.120.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.120.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.120.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.121.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.121.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.121.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.121.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.121.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.121.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.122.down_proj.weight": 
"model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.122.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.122.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.122.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.122.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.122.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.123.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.123.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.123.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.123.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.123.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.123.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.124.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.124.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.124.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.124.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.124.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.124.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.125.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.125.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.125.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.125.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + 
"model.layers.17.mlp.experts.125.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.125.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.126.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.126.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.126.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.126.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.126.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.126.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.127.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.127.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.127.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.127.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.127.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.127.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.128.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.128.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.128.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.128.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.128.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.128.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.129.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.129.down_proj.weight_scale": 
"model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.129.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.129.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.129.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.129.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.13.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.13.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.13.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.13.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.13.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.13.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.130.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.130.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.130.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.130.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.130.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.130.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.131.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.131.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.131.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.131.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.131.up_proj.weight": "model-00018-of-00092.safetensors", + 
"model.layers.17.mlp.experts.131.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.132.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.132.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.132.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.132.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.132.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.132.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.133.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.133.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.133.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.133.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.133.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.133.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.134.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.134.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.134.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.134.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.134.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.134.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.135.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.135.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.135.gate_proj.weight": 
"model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.135.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.135.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.135.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.136.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.136.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.136.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.136.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.136.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.136.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.137.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.137.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.137.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.137.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.137.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.137.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.138.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.138.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.138.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.138.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.138.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.138.up_proj.weight_scale": "model-00018-of-00092.safetensors", + 
"model.layers.17.mlp.experts.139.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.139.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.139.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.139.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.139.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.139.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.14.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.14.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.14.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.14.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.14.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.14.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.140.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.140.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.140.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.140.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.140.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.140.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.141.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.141.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.141.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.141.gate_proj.weight_scale": 
"model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.141.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.141.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.142.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.142.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.142.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.142.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.142.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.142.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.143.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.143.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.143.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.143.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.143.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.143.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.144.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.144.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.144.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.144.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.144.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.144.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.145.down_proj.weight": "model-00018-of-00092.safetensors", + 
"model.layers.17.mlp.experts.145.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.145.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.145.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.145.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.145.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.146.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.146.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.146.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.146.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.146.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.146.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.147.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.147.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.147.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.147.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.147.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.147.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.148.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.148.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.148.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.148.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.148.up_proj.weight": 
"model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.148.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.149.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.149.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.149.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.149.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.149.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.149.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.15.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.15.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.15.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.15.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.15.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.15.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.150.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.150.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.150.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.150.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.150.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.150.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.151.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.151.down_proj.weight_scale": "model-00018-of-00092.safetensors", + 
"model.layers.17.mlp.experts.151.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.151.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.151.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.151.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.152.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.152.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.152.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.152.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.152.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.152.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.153.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.153.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.153.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.153.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.153.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.153.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.154.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.154.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.154.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.154.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.154.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.154.up_proj.weight_scale": 
"model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.155.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.155.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.155.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.155.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.155.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.155.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.156.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.156.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.156.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.156.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.156.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.156.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.157.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.157.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.157.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.157.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.157.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.157.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.158.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.158.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.158.gate_proj.weight": "model-00018-of-00092.safetensors", + 
"model.layers.17.mlp.experts.158.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.158.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.158.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.159.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.159.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.159.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.159.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.159.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.159.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.16.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.16.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.16.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.16.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.16.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.16.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.17.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.17.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.17.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.17.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.17.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.17.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.18.down_proj.weight": 
"model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.18.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.18.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.18.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.18.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.18.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.19.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.19.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.19.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.19.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.19.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.19.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.2.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.2.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.2.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.2.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.2.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.2.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.20.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.20.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.20.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.20.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + 
"model.layers.17.mlp.experts.20.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.20.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.21.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.21.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.21.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.21.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.21.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.21.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.22.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.22.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.22.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.22.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.22.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.22.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.23.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.23.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.23.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.23.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.23.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.23.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.24.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.24.down_proj.weight_scale": 
"model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.24.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.24.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.24.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.24.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.25.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.25.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.25.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.25.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.25.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.25.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.26.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.26.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.26.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.26.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.26.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.26.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.27.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.27.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.27.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.27.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.27.up_proj.weight": "model-00018-of-00092.safetensors", + 
"model.layers.17.mlp.experts.27.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.28.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.28.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.28.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.28.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.28.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.28.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.29.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.29.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.29.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.29.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.29.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.29.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.3.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.3.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.3.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.3.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.3.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.3.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.30.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.30.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.30.gate_proj.weight": 
"model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.30.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.30.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.30.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.31.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.31.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.31.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.31.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.31.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.31.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.32.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.32.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.32.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.32.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.32.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.32.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.33.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.33.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.33.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.33.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.33.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.33.up_proj.weight_scale": "model-00018-of-00092.safetensors", + 
"model.layers.17.mlp.experts.34.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.34.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.34.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.34.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.34.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.34.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.35.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.35.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.35.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.35.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.35.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.35.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.36.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.36.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.36.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.36.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.36.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.36.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.37.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.37.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.37.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.37.gate_proj.weight_scale": 
"model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.37.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.37.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.38.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.38.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.38.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.38.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.38.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.38.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.39.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.39.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.39.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.39.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.39.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.39.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.4.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.4.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.4.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.4.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.4.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.4.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.40.down_proj.weight": "model-00018-of-00092.safetensors", + 
"model.layers.17.mlp.experts.40.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.40.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.40.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.40.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.40.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.41.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.41.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.41.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.41.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.41.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.41.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.42.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.42.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.42.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.42.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.42.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.42.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.43.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.43.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.43.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.43.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.43.up_proj.weight": 
"model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.43.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.44.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.44.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.44.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.44.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.44.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.44.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.45.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.45.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.45.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.45.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.45.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.45.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.46.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.46.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.46.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.46.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.46.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.46.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.47.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.47.down_proj.weight_scale": "model-00018-of-00092.safetensors", + 
"model.layers.17.mlp.experts.47.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.47.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.47.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.47.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.48.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.48.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.48.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.48.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.48.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.48.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.49.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.49.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.49.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.49.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.49.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.49.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.5.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.5.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.5.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.5.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.5.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.5.up_proj.weight_scale": "model-00018-of-00092.safetensors", 
+ "model.layers.17.mlp.experts.50.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.50.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.50.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.50.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.50.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.50.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.51.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.51.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.51.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.51.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.51.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.51.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.52.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.52.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.52.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.52.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.52.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.52.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.53.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.53.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.53.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.53.gate_proj.weight_scale": 
"model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.53.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.53.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.54.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.54.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.54.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.54.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.54.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.54.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.55.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.55.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.55.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.55.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.55.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.55.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.56.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.56.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.56.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.56.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.56.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.56.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.57.down_proj.weight": "model-00018-of-00092.safetensors", + 
"model.layers.17.mlp.experts.57.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.57.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.57.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.57.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.57.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.58.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.58.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.58.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.58.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.58.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.58.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.59.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.59.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.59.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.59.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.59.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.59.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.6.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.6.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.6.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.6.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.6.up_proj.weight": 
"model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.6.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.60.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.60.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.60.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.60.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.60.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.60.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.61.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.61.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.61.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.61.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.61.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.61.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.62.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.62.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.62.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.62.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.62.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.62.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.63.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.63.down_proj.weight_scale": "model-00018-of-00092.safetensors", + 
"model.layers.17.mlp.experts.63.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.63.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.63.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.63.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.64.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.64.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.64.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.64.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.64.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.64.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.65.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.65.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.65.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.65.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.65.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.65.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.66.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.66.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.66.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.66.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.66.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.66.up_proj.weight_scale": 
"model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.67.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.67.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.67.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.67.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.67.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.67.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.68.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.68.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.68.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.68.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.68.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.68.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.69.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.69.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.69.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.69.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.69.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.69.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.7.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.7.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.7.gate_proj.weight": "model-00018-of-00092.safetensors", + 
"model.layers.17.mlp.experts.7.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.7.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.7.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.70.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.70.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.70.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.70.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.70.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.70.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.71.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.71.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.71.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.71.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.71.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.71.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.72.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.72.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.72.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.72.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.72.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.72.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.73.down_proj.weight": 
"model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.73.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.73.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.73.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.73.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.73.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.74.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.74.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.74.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.74.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.74.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.74.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.75.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.75.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.75.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.75.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.75.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.75.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.76.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.76.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.76.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.76.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + 
"model.layers.17.mlp.experts.76.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.76.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.77.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.77.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.77.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.77.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.77.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.77.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.78.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.78.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.78.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.78.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.78.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.78.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.79.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.79.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.79.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.79.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.79.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.79.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.8.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.8.down_proj.weight_scale": 
"model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.8.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.8.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.8.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.8.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.80.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.80.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.80.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.80.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.80.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.80.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.81.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.81.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.81.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.81.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.81.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.81.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.82.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.82.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.82.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.82.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.82.up_proj.weight": "model-00018-of-00092.safetensors", + 
"model.layers.17.mlp.experts.82.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.83.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.83.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.83.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.83.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.83.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.83.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.84.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.84.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.84.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.84.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.84.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.84.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.85.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.85.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.85.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.85.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.85.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.85.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.86.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.86.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.86.gate_proj.weight": 
"model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.86.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.86.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.86.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.87.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.87.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.87.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.87.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.87.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.87.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.88.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.88.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.88.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.88.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.88.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.88.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.89.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.89.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.89.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.89.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.89.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.89.up_proj.weight_scale": "model-00018-of-00092.safetensors", + 
"model.layers.17.mlp.experts.9.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.9.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.9.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.9.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.9.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.9.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.90.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.90.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.90.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.90.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.90.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.90.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.91.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.91.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.91.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.91.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.91.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.91.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.92.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.92.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.92.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.92.gate_proj.weight_scale": 
"model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.92.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.92.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.93.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.93.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.93.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.93.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.93.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.93.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.94.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.94.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.94.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.94.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.94.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.94.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.95.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.95.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.95.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.95.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.95.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.95.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.96.down_proj.weight": "model-00018-of-00092.safetensors", + 
"model.layers.17.mlp.experts.96.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.96.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.96.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.96.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.96.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.97.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.97.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.97.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.97.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.97.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.97.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.98.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.98.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.98.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.98.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.98.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.98.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.99.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.99.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.99.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.99.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.99.up_proj.weight": 
"model-00018-of-00092.safetensors", + "model.layers.17.mlp.experts.99.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.gate.e_score_correction_bias": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.gate.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.shared_experts.down_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.shared_experts.down_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.shared_experts.gate_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.shared_experts.gate_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.shared_experts.up_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.mlp.shared_experts.up_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.post_attention_layernorm.weight": "model-00018-of-00092.safetensors", + "model.layers.17.self_attn.k_norm.weight": "model-00018-of-00092.safetensors", + "model.layers.17.self_attn.k_proj.bias": "model-00018-of-00092.safetensors", + "model.layers.17.self_attn.k_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.self_attn.k_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.self_attn.o_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.self_attn.o_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.self_attn.q_norm.weight": "model-00018-of-00092.safetensors", + "model.layers.17.self_attn.q_proj.bias": "model-00018-of-00092.safetensors", + "model.layers.17.self_attn.q_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.self_attn.q_proj.weight_scale": "model-00018-of-00092.safetensors", + "model.layers.17.self_attn.v_proj.bias": "model-00018-of-00092.safetensors", + "model.layers.17.self_attn.v_proj.weight": "model-00018-of-00092.safetensors", + "model.layers.17.self_attn.v_proj.weight_scale": 
"model-00018-of-00092.safetensors", + "model.layers.18.input_layernorm.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.0.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.0.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.0.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.0.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.0.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.0.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.1.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.1.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.1.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.1.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.1.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.1.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.10.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.10.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.10.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.10.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.10.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.10.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.100.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.100.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.100.gate_proj.weight": 
"model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.100.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.100.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.100.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.101.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.101.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.101.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.101.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.101.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.101.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.102.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.102.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.102.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.102.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.102.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.102.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.103.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.103.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.103.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.103.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.103.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.103.up_proj.weight_scale": "model-00019-of-00092.safetensors", + 
"model.layers.18.mlp.experts.104.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.104.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.104.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.104.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.104.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.104.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.105.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.105.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.105.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.105.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.105.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.105.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.106.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.106.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.106.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.106.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.106.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.106.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.107.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.107.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.107.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.107.gate_proj.weight_scale": 
"model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.107.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.107.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.108.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.108.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.108.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.108.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.108.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.108.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.109.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.109.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.109.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.109.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.109.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.109.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.11.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.11.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.11.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.11.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.11.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.11.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.110.down_proj.weight": "model-00019-of-00092.safetensors", + 
"model.layers.18.mlp.experts.110.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.110.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.110.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.110.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.110.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.111.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.111.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.111.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.111.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.111.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.111.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.112.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.112.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.112.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.112.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.112.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.112.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.113.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.113.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.113.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.113.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.113.up_proj.weight": 
"model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.113.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.114.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.114.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.114.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.114.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.114.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.114.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.115.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.115.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.115.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.115.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.115.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.115.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.116.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.116.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.116.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.116.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.116.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.116.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.117.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.117.down_proj.weight_scale": "model-00019-of-00092.safetensors", + 
"model.layers.18.mlp.experts.117.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.117.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.117.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.117.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.118.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.118.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.118.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.118.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.118.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.118.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.119.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.119.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.119.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.119.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.119.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.119.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.12.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.12.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.12.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.12.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.12.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.12.up_proj.weight_scale": 
"model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.120.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.120.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.120.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.120.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.120.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.120.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.121.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.121.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.121.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.121.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.121.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.121.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.122.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.122.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.122.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.122.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.122.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.122.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.123.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.123.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.123.gate_proj.weight": "model-00019-of-00092.safetensors", + 
"model.layers.18.mlp.experts.123.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.123.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.123.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.124.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.124.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.124.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.124.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.124.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.124.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.125.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.125.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.125.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.125.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.125.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.125.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.126.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.126.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.126.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.126.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.126.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.126.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.127.down_proj.weight": 
"model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.127.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.127.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.127.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.127.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.127.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.128.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.128.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.128.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.128.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.128.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.128.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.129.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.129.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.129.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.129.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.129.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.129.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.13.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.13.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.13.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.13.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + 
"model.layers.18.mlp.experts.13.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.13.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.130.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.130.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.130.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.130.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.130.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.130.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.131.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.131.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.131.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.131.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.131.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.131.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.132.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.132.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.132.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.132.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.132.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.132.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.133.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.133.down_proj.weight_scale": 
"model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.133.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.133.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.133.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.133.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.134.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.134.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.134.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.134.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.134.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.134.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.135.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.135.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.135.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.135.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.135.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.135.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.136.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.136.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.136.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.136.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.136.up_proj.weight": "model-00019-of-00092.safetensors", + 
"model.layers.18.mlp.experts.136.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.137.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.137.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.137.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.137.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.137.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.137.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.138.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.138.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.138.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.138.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.138.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.138.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.139.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.139.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.139.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.139.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.139.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.139.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.14.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.14.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.14.gate_proj.weight": 
"model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.14.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.14.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.14.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.140.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.140.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.140.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.140.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.140.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.140.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.141.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.141.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.141.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.141.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.141.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.141.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.142.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.142.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.142.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.142.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.142.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.142.up_proj.weight_scale": "model-00019-of-00092.safetensors", + 
"model.layers.18.mlp.experts.143.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.143.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.143.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.143.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.143.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.143.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.144.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.144.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.144.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.144.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.144.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.144.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.145.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.145.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.145.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.145.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.145.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.145.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.146.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.146.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.146.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.146.gate_proj.weight_scale": 
"model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.146.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.146.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.147.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.147.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.147.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.147.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.147.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.147.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.148.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.148.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.148.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.148.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.148.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.148.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.149.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.149.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.149.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.149.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.149.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.149.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.15.down_proj.weight": "model-00019-of-00092.safetensors", + 
"model.layers.18.mlp.experts.15.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.15.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.15.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.15.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.15.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.150.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.150.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.150.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.150.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.150.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.150.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.151.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.151.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.151.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.151.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.151.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.151.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.152.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.152.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.152.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.152.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.152.up_proj.weight": 
"model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.152.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.153.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.153.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.153.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.153.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.153.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.153.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.154.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.154.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.154.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.154.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.154.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.154.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.155.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.155.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.155.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.155.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.155.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.155.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.156.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.156.down_proj.weight_scale": "model-00019-of-00092.safetensors", + 
"model.layers.18.mlp.experts.156.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.156.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.156.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.156.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.157.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.157.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.157.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.157.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.157.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.157.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.158.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.158.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.158.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.158.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.158.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.158.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.159.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.159.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.159.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.159.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.159.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.159.up_proj.weight_scale": 
"model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.16.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.16.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.16.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.16.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.16.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.16.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.17.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.17.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.17.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.17.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.17.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.17.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.18.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.18.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.18.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.18.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.18.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.18.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.19.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.19.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.19.gate_proj.weight": "model-00019-of-00092.safetensors", + 
"model.layers.18.mlp.experts.19.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.19.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.19.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.2.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.2.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.2.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.2.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.2.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.2.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.20.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.20.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.20.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.20.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.20.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.20.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.21.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.21.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.21.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.21.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.21.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.21.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.22.down_proj.weight": "model-00019-of-00092.safetensors", 
+ "model.layers.18.mlp.experts.22.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.22.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.22.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.22.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.22.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.23.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.23.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.23.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.23.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.23.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.23.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.24.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.24.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.24.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.24.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.24.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.24.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.25.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.25.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.25.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.25.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.25.up_proj.weight": 
"model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.25.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.26.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.26.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.26.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.26.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.26.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.26.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.27.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.27.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.27.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.27.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.27.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.27.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.28.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.28.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.28.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.28.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.28.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.28.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.29.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.29.down_proj.weight_scale": "model-00019-of-00092.safetensors", + 
"model.layers.18.mlp.experts.29.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.29.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.29.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.29.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.3.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.3.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.3.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.3.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.3.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.3.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.30.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.30.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.30.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.30.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.30.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.30.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.31.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.31.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.31.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.31.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.31.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.31.up_proj.weight_scale": "model-00019-of-00092.safetensors", 
+ "model.layers.18.mlp.experts.32.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.32.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.32.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.32.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.32.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.32.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.33.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.33.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.33.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.33.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.33.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.33.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.34.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.34.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.34.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.34.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.34.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.34.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.35.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.35.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.35.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.35.gate_proj.weight_scale": 
"model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.35.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.35.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.36.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.36.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.36.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.36.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.36.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.36.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.37.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.37.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.37.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.37.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.37.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.37.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.38.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.38.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.38.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.38.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.38.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.38.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.39.down_proj.weight": "model-00019-of-00092.safetensors", + 
"model.layers.18.mlp.experts.39.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.39.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.39.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.39.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.39.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.4.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.4.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.4.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.4.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.4.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.4.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.40.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.40.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.40.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.40.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.40.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.40.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.41.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.41.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.41.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.41.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.41.up_proj.weight": 
"model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.41.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.42.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.42.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.42.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.42.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.42.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.42.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.43.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.43.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.43.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.43.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.43.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.43.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.44.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.44.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.44.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.44.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.44.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.44.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.45.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.45.down_proj.weight_scale": "model-00019-of-00092.safetensors", + 
"model.layers.18.mlp.experts.45.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.45.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.45.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.45.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.46.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.46.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.46.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.46.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.46.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.46.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.47.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.47.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.47.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.47.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.47.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.47.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.48.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.48.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.48.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.48.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.48.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.48.up_proj.weight_scale": 
"model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.49.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.49.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.49.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.49.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.49.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.49.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.5.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.5.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.5.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.5.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.5.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.5.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.50.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.50.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.50.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.50.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.50.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.50.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.51.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.51.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.51.gate_proj.weight": "model-00019-of-00092.safetensors", + 
"model.layers.18.mlp.experts.51.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.51.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.51.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.52.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.52.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.52.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.52.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.52.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.52.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.53.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.53.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.53.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.53.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.53.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.53.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.54.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.54.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.54.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.54.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.54.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.54.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.55.down_proj.weight": 
"model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.55.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.55.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.55.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.55.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.55.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.56.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.56.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.56.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.56.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.56.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.56.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.57.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.57.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.57.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.57.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.57.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.57.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.58.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.58.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.58.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.58.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + 
"model.layers.18.mlp.experts.58.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.58.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.59.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.59.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.59.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.59.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.59.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.59.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.6.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.6.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.6.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.6.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.6.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.6.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.60.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.60.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.60.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.60.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.60.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.60.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.61.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.61.down_proj.weight_scale": "model-00019-of-00092.safetensors", 
+ "model.layers.18.mlp.experts.61.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.61.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.61.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.61.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.62.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.62.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.62.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.62.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.62.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.62.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.63.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.63.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.63.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.63.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.63.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.63.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.64.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.64.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.64.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.64.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.64.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.64.up_proj.weight_scale": 
"model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.65.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.65.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.65.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.65.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.65.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.65.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.66.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.66.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.66.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.66.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.66.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.66.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.67.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.67.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.67.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.67.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.67.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.67.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.68.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.68.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.68.gate_proj.weight": "model-00019-of-00092.safetensors", + 
"model.layers.18.mlp.experts.68.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.68.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.68.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.69.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.69.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.69.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.69.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.69.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.69.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.7.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.7.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.7.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.7.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.7.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.7.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.70.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.70.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.70.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.70.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.70.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.70.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.71.down_proj.weight": "model-00019-of-00092.safetensors", 
+ "model.layers.18.mlp.experts.71.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.71.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.71.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.71.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.71.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.72.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.72.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.72.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.72.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.72.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.72.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.73.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.73.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.73.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.73.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.73.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.73.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.74.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.74.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.74.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.74.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.74.up_proj.weight": 
"model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.74.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.75.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.75.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.75.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.75.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.75.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.75.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.76.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.76.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.76.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.76.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.76.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.76.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.77.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.77.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.77.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.77.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.77.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.77.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.78.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.78.down_proj.weight_scale": "model-00019-of-00092.safetensors", + 
"model.layers.18.mlp.experts.78.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.78.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.78.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.78.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.79.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.79.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.79.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.79.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.79.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.79.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.8.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.8.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.8.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.8.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.8.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.8.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.80.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.80.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.80.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.80.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.80.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.80.up_proj.weight_scale": "model-00019-of-00092.safetensors", 
+ "model.layers.18.mlp.experts.81.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.81.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.81.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.81.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.81.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.81.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.82.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.82.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.82.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.82.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.82.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.82.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.83.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.83.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.83.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.83.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.83.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.83.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.84.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.84.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.84.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.84.gate_proj.weight_scale": 
"model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.84.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.84.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.85.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.85.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.85.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.85.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.85.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.85.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.86.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.86.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.86.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.86.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.86.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.86.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.87.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.87.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.87.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.87.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.87.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.87.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.88.down_proj.weight": "model-00019-of-00092.safetensors", + 
"model.layers.18.mlp.experts.88.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.88.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.88.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.88.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.88.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.89.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.89.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.89.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.89.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.89.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.89.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.9.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.9.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.9.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.9.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.9.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.9.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.90.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.90.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.90.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.90.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.90.up_proj.weight": 
"model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.90.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.91.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.91.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.91.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.91.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.91.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.91.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.92.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.92.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.92.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.92.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.92.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.92.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.93.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.93.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.93.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.93.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.93.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.93.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.94.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.94.down_proj.weight_scale": "model-00019-of-00092.safetensors", + 
"model.layers.18.mlp.experts.94.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.94.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.94.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.94.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.95.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.95.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.95.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.95.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.95.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.95.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.96.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.96.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.96.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.96.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.96.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.96.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.97.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.97.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.97.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.97.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.97.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.97.up_proj.weight_scale": 
"model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.98.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.98.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.98.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.98.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.98.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.98.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.99.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.99.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.99.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.99.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.99.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.experts.99.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.gate.e_score_correction_bias": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.gate.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.shared_experts.down_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.shared_experts.down_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.shared_experts.gate_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.shared_experts.gate_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.shared_experts.up_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.mlp.shared_experts.up_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.post_attention_layernorm.weight": "model-00019-of-00092.safetensors", + 
"model.layers.18.self_attn.k_norm.weight": "model-00019-of-00092.safetensors", + "model.layers.18.self_attn.k_proj.bias": "model-00019-of-00092.safetensors", + "model.layers.18.self_attn.k_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.self_attn.k_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.self_attn.o_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.self_attn.o_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.self_attn.q_norm.weight": "model-00019-of-00092.safetensors", + "model.layers.18.self_attn.q_proj.bias": "model-00019-of-00092.safetensors", + "model.layers.18.self_attn.q_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.self_attn.q_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.18.self_attn.v_proj.bias": "model-00019-of-00092.safetensors", + "model.layers.18.self_attn.v_proj.weight": "model-00019-of-00092.safetensors", + "model.layers.18.self_attn.v_proj.weight_scale": "model-00019-of-00092.safetensors", + "model.layers.19.input_layernorm.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.0.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.0.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.0.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.0.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.0.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.0.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.1.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.1.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.1.gate_proj.weight": "model-00020-of-00092.safetensors", + 
"model.layers.19.mlp.experts.1.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.1.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.1.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.10.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.10.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.10.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.10.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.10.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.10.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.100.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.100.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.100.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.100.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.100.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.100.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.101.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.101.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.101.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.101.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.101.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.101.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.102.down_proj.weight": 
"model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.102.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.102.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.102.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.102.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.102.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.103.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.103.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.103.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.103.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.103.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.103.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.104.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.104.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.104.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.104.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.104.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.104.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.105.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.105.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.105.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.105.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + 
"model.layers.19.mlp.experts.105.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.105.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.106.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.106.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.106.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.106.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.106.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.106.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.107.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.107.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.107.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.107.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.107.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.107.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.108.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.108.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.108.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.108.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.108.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.108.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.109.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.109.down_proj.weight_scale": 
"model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.109.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.109.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.109.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.109.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.11.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.11.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.11.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.11.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.11.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.11.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.110.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.110.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.110.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.110.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.110.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.110.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.111.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.111.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.111.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.111.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.111.up_proj.weight": "model-00020-of-00092.safetensors", + 
"model.layers.19.mlp.experts.111.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.112.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.112.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.112.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.112.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.112.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.112.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.113.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.113.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.113.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.113.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.113.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.113.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.114.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.114.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.114.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.114.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.114.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.114.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.115.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.115.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.115.gate_proj.weight": 
"model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.115.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.115.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.115.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.116.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.116.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.116.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.116.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.116.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.116.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.117.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.117.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.117.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.117.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.117.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.117.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.118.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.118.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.118.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.118.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.118.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.118.up_proj.weight_scale": "model-00020-of-00092.safetensors", + 
"model.layers.19.mlp.experts.119.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.119.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.119.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.119.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.119.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.119.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.12.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.12.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.12.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.12.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.12.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.12.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.120.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.120.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.120.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.120.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.120.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.120.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.121.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.121.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.121.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.121.gate_proj.weight_scale": 
"model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.121.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.121.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.122.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.122.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.122.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.122.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.122.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.122.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.123.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.123.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.123.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.123.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.123.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.123.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.124.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.124.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.124.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.124.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.124.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.124.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.125.down_proj.weight": "model-00020-of-00092.safetensors", + 
"model.layers.19.mlp.experts.125.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.125.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.125.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.125.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.125.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.126.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.126.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.126.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.126.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.126.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.126.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.127.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.127.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.127.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.127.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.127.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.127.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.128.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.128.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.128.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.128.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.128.up_proj.weight": 
"model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.128.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.129.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.129.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.129.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.129.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.129.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.129.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.13.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.13.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.13.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.13.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.13.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.13.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.130.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.130.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.130.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.130.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.130.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.130.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.131.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.131.down_proj.weight_scale": "model-00020-of-00092.safetensors", + 
"model.layers.19.mlp.experts.131.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.131.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.131.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.131.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.132.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.132.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.132.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.132.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.132.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.132.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.133.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.133.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.133.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.133.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.133.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.133.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.134.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.134.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.134.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.134.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.134.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.134.up_proj.weight_scale": 
"model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.135.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.135.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.135.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.135.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.135.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.135.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.136.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.136.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.136.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.136.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.136.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.136.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.137.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.137.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.137.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.137.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.137.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.137.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.138.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.138.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.138.gate_proj.weight": "model-00020-of-00092.safetensors", + 
"model.layers.19.mlp.experts.138.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.138.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.138.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.139.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.139.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.139.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.139.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.139.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.139.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.14.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.14.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.14.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.14.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.14.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.14.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.140.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.140.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.140.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.140.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.140.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.140.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.141.down_proj.weight": 
"model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.141.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.141.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.141.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.141.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.141.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.142.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.142.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.142.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.142.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.142.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.142.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.143.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.143.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.143.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.143.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.143.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.143.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.144.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.144.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.144.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.144.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + 
"model.layers.19.mlp.experts.144.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.144.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.145.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.145.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.145.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.145.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.145.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.145.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.146.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.146.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.146.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.146.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.146.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.146.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.147.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.147.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.147.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.147.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.147.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.147.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.148.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.148.down_proj.weight_scale": 
"model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.148.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.148.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.148.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.148.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.149.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.149.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.149.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.149.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.149.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.149.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.15.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.15.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.15.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.15.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.15.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.15.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.150.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.150.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.150.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.150.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.150.up_proj.weight": "model-00020-of-00092.safetensors", + 
"model.layers.19.mlp.experts.150.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.151.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.151.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.151.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.151.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.151.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.151.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.152.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.152.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.152.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.152.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.152.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.152.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.153.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.153.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.153.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.153.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.153.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.153.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.154.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.154.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.154.gate_proj.weight": 
"model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.154.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.154.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.154.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.155.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.155.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.155.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.155.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.155.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.155.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.156.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.156.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.156.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.156.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.156.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.156.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.157.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.157.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.157.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.157.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.157.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.157.up_proj.weight_scale": "model-00020-of-00092.safetensors", + 
"model.layers.19.mlp.experts.158.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.158.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.158.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.158.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.158.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.158.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.159.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.159.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.159.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.159.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.159.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.159.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.16.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.16.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.16.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.16.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.16.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.16.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.17.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.17.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.17.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.17.gate_proj.weight_scale": 
"model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.17.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.17.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.18.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.18.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.18.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.18.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.18.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.18.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.19.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.19.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.19.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.19.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.19.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.19.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.2.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.2.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.2.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.2.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.2.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.2.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.20.down_proj.weight": "model-00020-of-00092.safetensors", + 
"model.layers.19.mlp.experts.20.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.20.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.20.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.20.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.20.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.21.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.21.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.21.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.21.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.21.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.21.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.22.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.22.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.22.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.22.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.22.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.22.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.23.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.23.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.23.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.23.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.23.up_proj.weight": 
"model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.23.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.24.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.24.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.24.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.24.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.24.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.24.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.25.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.25.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.25.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.25.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.25.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.25.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.26.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.26.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.26.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.26.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.26.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.26.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.27.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.27.down_proj.weight_scale": "model-00020-of-00092.safetensors", + 
"model.layers.19.mlp.experts.27.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.27.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.27.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.27.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.28.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.28.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.28.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.28.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.28.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.28.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.29.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.29.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.29.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.29.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.29.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.29.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.3.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.3.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.3.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.3.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.3.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.3.up_proj.weight_scale": "model-00020-of-00092.safetensors", 
+ "model.layers.19.mlp.experts.30.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.30.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.30.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.30.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.30.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.30.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.31.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.31.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.31.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.31.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.31.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.31.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.32.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.32.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.32.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.32.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.32.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.32.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.33.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.33.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.33.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.33.gate_proj.weight_scale": 
"model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.33.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.33.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.34.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.34.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.34.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.34.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.34.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.34.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.35.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.35.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.35.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.35.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.35.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.35.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.36.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.36.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.36.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.36.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.36.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.36.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.37.down_proj.weight": "model-00020-of-00092.safetensors", + 
"model.layers.19.mlp.experts.37.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.37.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.37.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.37.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.37.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.38.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.38.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.38.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.38.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.38.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.38.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.39.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.39.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.39.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.39.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.39.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.39.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.4.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.4.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.4.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.4.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.4.up_proj.weight": 
"model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.4.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.40.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.40.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.40.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.40.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.40.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.40.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.41.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.41.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.41.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.41.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.41.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.41.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.42.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.42.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.42.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.42.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.42.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.42.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.43.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.43.down_proj.weight_scale": "model-00020-of-00092.safetensors", + 
"model.layers.19.mlp.experts.43.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.43.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.43.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.43.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.44.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.44.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.44.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.44.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.44.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.44.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.45.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.45.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.45.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.45.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.45.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.45.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.46.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.46.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.46.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.46.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.46.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.46.up_proj.weight_scale": 
"model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.47.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.47.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.47.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.47.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.47.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.47.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.48.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.48.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.48.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.48.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.48.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.48.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.49.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.49.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.49.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.49.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.49.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.49.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.5.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.5.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.5.gate_proj.weight": "model-00020-of-00092.safetensors", + 
"model.layers.19.mlp.experts.5.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.5.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.5.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.50.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.50.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.50.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.50.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.50.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.50.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.51.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.51.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.51.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.51.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.51.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.51.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.52.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.52.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.52.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.52.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.52.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.52.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.53.down_proj.weight": 
"model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.53.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.53.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.53.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.53.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.53.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.54.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.54.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.54.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.54.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.54.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.54.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.55.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.55.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.55.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.55.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.55.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.55.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.56.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.56.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.56.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.56.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + 
"model.layers.19.mlp.experts.56.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.56.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.57.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.57.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.57.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.57.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.57.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.57.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.58.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.58.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.58.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.58.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.58.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.58.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.59.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.59.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.59.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.59.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.59.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.59.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.6.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.6.down_proj.weight_scale": 
"model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.6.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.6.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.6.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.6.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.60.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.60.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.60.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.60.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.60.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.60.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.61.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.61.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.61.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.61.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.61.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.61.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.62.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.62.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.62.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.62.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.62.up_proj.weight": "model-00020-of-00092.safetensors", + 
"model.layers.19.mlp.experts.62.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.63.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.63.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.63.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.63.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.63.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.63.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.64.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.64.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.64.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.64.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.64.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.64.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.65.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.65.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.65.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.65.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.65.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.65.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.66.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.66.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.66.gate_proj.weight": 
"model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.66.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.66.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.66.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.67.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.67.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.67.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.67.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.67.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.67.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.68.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.68.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.68.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.68.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.68.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.68.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.69.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.69.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.69.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.69.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.69.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.69.up_proj.weight_scale": "model-00020-of-00092.safetensors", + 
"model.layers.19.mlp.experts.7.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.7.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.7.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.7.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.7.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.7.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.70.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.70.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.70.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.70.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.70.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.70.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.71.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.71.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.71.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.71.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.71.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.71.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.72.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.72.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.72.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.72.gate_proj.weight_scale": 
"model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.72.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.72.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.73.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.73.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.73.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.73.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.73.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.73.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.74.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.74.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.74.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.74.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.74.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.74.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.75.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.75.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.75.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.75.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.75.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.75.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.76.down_proj.weight": "model-00020-of-00092.safetensors", + 
"model.layers.19.mlp.experts.76.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.76.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.76.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.76.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.76.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.77.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.77.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.77.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.77.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.77.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.77.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.78.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.78.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.78.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.78.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.78.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.78.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.79.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.79.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.79.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.79.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.79.up_proj.weight": 
"model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.79.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.8.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.8.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.8.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.8.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.8.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.8.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.80.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.80.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.80.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.80.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.80.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.80.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.81.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.81.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.81.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.81.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.81.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.81.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.82.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.82.down_proj.weight_scale": "model-00020-of-00092.safetensors", + 
"model.layers.19.mlp.experts.82.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.82.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.82.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.82.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.83.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.83.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.83.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.83.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.83.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.83.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.84.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.84.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.84.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.84.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.84.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.84.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.85.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.85.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.85.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.85.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.85.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.85.up_proj.weight_scale": 
"model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.86.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.86.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.86.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.86.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.86.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.86.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.87.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.87.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.87.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.87.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.87.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.87.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.88.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.88.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.88.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.88.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.88.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.88.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.89.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.89.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.89.gate_proj.weight": "model-00020-of-00092.safetensors", + 
"model.layers.19.mlp.experts.89.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.89.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.89.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.9.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.9.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.9.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.9.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.9.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.9.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.90.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.90.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.90.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.90.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.90.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.90.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.91.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.91.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.91.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.91.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.91.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.91.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.92.down_proj.weight": "model-00020-of-00092.safetensors", 
+ "model.layers.19.mlp.experts.92.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.92.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.92.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.92.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.92.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.93.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.93.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.93.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.93.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.93.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.93.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.94.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.94.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.94.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.94.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.94.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.94.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.95.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.95.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.95.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.95.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.95.up_proj.weight": 
"model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.95.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.96.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.96.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.96.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.96.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.96.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.96.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.97.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.97.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.97.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.97.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.97.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.97.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.98.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.98.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.98.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.98.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.98.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.98.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.99.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.99.down_proj.weight_scale": "model-00020-of-00092.safetensors", + 
"model.layers.19.mlp.experts.99.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.99.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.99.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.experts.99.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.gate.e_score_correction_bias": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.gate.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.shared_experts.down_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.shared_experts.down_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.shared_experts.gate_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.shared_experts.gate_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.shared_experts.up_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.mlp.shared_experts.up_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.post_attention_layernorm.weight": "model-00020-of-00092.safetensors", + "model.layers.19.self_attn.k_norm.weight": "model-00020-of-00092.safetensors", + "model.layers.19.self_attn.k_proj.bias": "model-00020-of-00092.safetensors", + "model.layers.19.self_attn.k_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.self_attn.k_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.self_attn.o_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.self_attn.o_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.19.self_attn.q_norm.weight": "model-00020-of-00092.safetensors", + "model.layers.19.self_attn.q_proj.bias": "model-00020-of-00092.safetensors", + "model.layers.19.self_attn.q_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.self_attn.q_proj.weight_scale": 
"model-00020-of-00092.safetensors", + "model.layers.19.self_attn.v_proj.bias": "model-00020-of-00092.safetensors", + "model.layers.19.self_attn.v_proj.weight": "model-00020-of-00092.safetensors", + "model.layers.19.self_attn.v_proj.weight_scale": "model-00020-of-00092.safetensors", + "model.layers.20.input_layernorm.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.0.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.0.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.0.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.0.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.0.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.0.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.1.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.1.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.1.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.1.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.1.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.1.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.10.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.10.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.10.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.10.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.10.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.10.up_proj.weight_scale": "model-00021-of-00092.safetensors", + 
"model.layers.20.mlp.experts.100.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.100.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.100.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.100.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.100.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.100.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.101.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.101.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.101.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.101.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.101.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.101.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.102.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.102.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.102.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.102.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.102.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.102.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.103.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.103.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.103.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.103.gate_proj.weight_scale": 
"model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.103.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.103.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.104.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.104.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.104.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.104.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.104.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.104.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.105.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.105.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.105.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.105.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.105.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.105.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.106.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.106.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.106.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.106.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.106.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.106.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.107.down_proj.weight": "model-00021-of-00092.safetensors", + 
"model.layers.20.mlp.experts.107.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.107.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.107.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.107.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.107.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.108.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.108.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.108.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.108.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.108.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.108.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.109.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.109.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.109.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.109.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.109.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.109.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.11.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.11.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.11.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.11.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.11.up_proj.weight": 
"model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.11.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.110.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.110.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.110.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.110.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.110.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.110.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.111.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.111.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.111.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.111.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.111.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.111.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.112.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.112.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.112.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.112.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.112.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.112.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.113.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.113.down_proj.weight_scale": "model-00021-of-00092.safetensors", + 
"model.layers.20.mlp.experts.113.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.113.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.113.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.113.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.114.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.114.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.114.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.114.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.114.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.114.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.115.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.115.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.115.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.115.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.115.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.115.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.116.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.116.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.116.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.116.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.116.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.116.up_proj.weight_scale": 
"model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.117.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.117.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.117.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.117.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.117.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.117.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.118.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.118.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.118.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.118.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.118.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.118.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.119.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.119.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.119.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.119.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.119.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.119.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.12.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.12.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.12.gate_proj.weight": "model-00021-of-00092.safetensors", + 
"model.layers.20.mlp.experts.12.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.12.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.12.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.120.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.120.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.120.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.120.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.120.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.120.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.121.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.121.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.121.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.121.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.121.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.121.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.122.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.122.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.122.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.122.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.122.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.122.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.123.down_proj.weight": 
"model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.123.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.123.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.123.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.123.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.123.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.124.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.124.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.124.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.124.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.124.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.124.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.125.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.125.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.125.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.125.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.125.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.125.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.126.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.126.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.126.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.126.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + 
"model.layers.20.mlp.experts.126.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.126.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.127.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.127.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.127.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.127.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.127.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.127.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.128.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.128.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.128.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.128.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.128.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.128.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.129.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.129.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.129.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.129.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.129.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.129.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.13.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.13.down_proj.weight_scale": 
"model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.13.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.13.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.13.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.13.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.130.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.130.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.130.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.130.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.130.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.130.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.131.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.131.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.131.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.131.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.131.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.131.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.132.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.132.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.132.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.132.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.132.up_proj.weight": "model-00021-of-00092.safetensors", + 
"model.layers.20.mlp.experts.132.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.133.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.133.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.133.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.133.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.133.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.133.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.134.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.134.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.134.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.134.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.134.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.134.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.135.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.135.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.135.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.135.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.135.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.135.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.136.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.136.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.136.gate_proj.weight": 
"model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.136.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.136.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.136.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.137.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.137.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.137.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.137.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.137.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.137.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.138.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.138.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.138.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.138.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.138.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.138.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.139.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.139.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.139.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.139.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.139.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.139.up_proj.weight_scale": "model-00021-of-00092.safetensors", + 
"model.layers.20.mlp.experts.14.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.14.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.14.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.14.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.14.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.14.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.140.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.140.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.140.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.140.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.140.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.140.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.141.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.141.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.141.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.141.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.141.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.141.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.142.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.142.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.142.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.142.gate_proj.weight_scale": 
"model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.142.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.142.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.143.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.143.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.143.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.143.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.143.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.143.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.144.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.144.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.144.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.144.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.144.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.144.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.145.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.145.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.145.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.145.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.145.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.145.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.146.down_proj.weight": "model-00021-of-00092.safetensors", + 
"model.layers.20.mlp.experts.146.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.146.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.146.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.146.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.146.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.147.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.147.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.147.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.147.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.147.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.147.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.148.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.148.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.148.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.148.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.148.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.148.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.149.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.149.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.149.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.149.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.149.up_proj.weight": 
"model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.149.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.15.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.15.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.15.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.15.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.15.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.15.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.150.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.150.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.150.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.150.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.150.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.150.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.151.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.151.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.151.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.151.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.151.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.151.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.152.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.152.down_proj.weight_scale": "model-00021-of-00092.safetensors", + 
"model.layers.20.mlp.experts.152.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.152.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.152.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.152.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.153.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.153.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.153.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.153.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.153.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.153.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.154.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.154.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.154.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.154.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.154.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.154.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.155.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.155.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.155.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.155.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.155.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.155.up_proj.weight_scale": 
"model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.156.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.156.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.156.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.156.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.156.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.156.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.157.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.157.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.157.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.157.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.157.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.157.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.158.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.158.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.158.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.158.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.158.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.158.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.159.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.159.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.159.gate_proj.weight": "model-00021-of-00092.safetensors", + 
"model.layers.20.mlp.experts.159.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.159.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.159.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.16.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.16.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.16.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.16.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.16.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.16.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.17.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.17.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.17.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.17.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.17.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.17.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.18.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.18.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.18.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.18.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.18.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.18.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.19.down_proj.weight": 
"model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.19.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.19.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.19.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.19.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.19.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.2.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.2.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.2.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.2.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.2.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.2.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.20.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.20.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.20.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.20.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.20.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.20.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.21.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.21.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.21.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.21.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + 
"model.layers.20.mlp.experts.21.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.21.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.22.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.22.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.22.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.22.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.22.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.22.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.23.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.23.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.23.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.23.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.23.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.23.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.24.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.24.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.24.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.24.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.24.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.24.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.25.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.25.down_proj.weight_scale": 
"model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.25.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.25.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.25.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.25.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.26.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.26.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.26.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.26.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.26.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.26.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.27.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.27.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.27.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.27.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.27.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.27.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.28.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.28.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.28.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.28.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.28.up_proj.weight": "model-00021-of-00092.safetensors", + 
"model.layers.20.mlp.experts.28.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.29.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.29.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.29.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.29.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.29.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.29.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.3.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.3.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.3.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.3.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.3.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.3.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.30.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.30.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.30.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.30.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.30.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.30.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.31.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.31.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.31.gate_proj.weight": 
"model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.31.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.31.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.31.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.32.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.32.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.32.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.32.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.32.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.32.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.33.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.33.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.33.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.33.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.33.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.33.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.34.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.34.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.34.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.34.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.34.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.34.up_proj.weight_scale": "model-00021-of-00092.safetensors", + 
"model.layers.20.mlp.experts.35.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.35.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.35.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.35.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.35.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.35.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.36.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.36.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.36.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.36.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.36.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.36.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.37.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.37.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.37.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.37.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.37.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.37.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.38.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.38.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.38.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.38.gate_proj.weight_scale": 
"model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.38.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.38.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.39.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.39.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.39.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.39.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.39.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.39.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.4.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.4.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.4.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.4.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.4.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.4.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.40.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.40.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.40.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.40.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.40.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.40.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.41.down_proj.weight": "model-00021-of-00092.safetensors", + 
"model.layers.20.mlp.experts.41.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.41.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.41.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.41.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.41.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.42.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.42.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.42.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.42.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.42.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.42.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.43.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.43.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.43.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.43.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.43.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.43.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.44.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.44.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.44.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.44.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.44.up_proj.weight": 
"model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.44.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.45.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.45.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.45.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.45.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.45.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.45.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.46.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.46.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.46.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.46.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.46.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.46.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.47.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.47.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.47.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.47.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.47.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.47.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.48.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.48.down_proj.weight_scale": "model-00021-of-00092.safetensors", + 
"model.layers.20.mlp.experts.48.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.48.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.48.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.48.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.49.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.49.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.49.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.49.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.49.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.49.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.5.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.5.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.5.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.5.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.5.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.5.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.50.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.50.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.50.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.50.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.50.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.50.up_proj.weight_scale": "model-00021-of-00092.safetensors", 
+ "model.layers.20.mlp.experts.51.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.51.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.51.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.51.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.51.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.51.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.52.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.52.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.52.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.52.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.52.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.52.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.53.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.53.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.53.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.53.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.53.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.53.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.54.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.54.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.54.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.54.gate_proj.weight_scale": 
"model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.54.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.54.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.55.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.55.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.55.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.55.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.55.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.55.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.56.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.56.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.56.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.56.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.56.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.56.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.57.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.57.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.57.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.57.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.57.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.57.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.58.down_proj.weight": "model-00021-of-00092.safetensors", + 
"model.layers.20.mlp.experts.58.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.58.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.58.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.58.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.58.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.59.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.59.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.59.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.59.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.59.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.59.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.6.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.6.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.6.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.6.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.6.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.6.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.60.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.60.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.60.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.60.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.60.up_proj.weight": 
"model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.60.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.61.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.61.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.61.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.61.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.61.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.61.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.62.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.62.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.62.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.62.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.62.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.62.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.63.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.63.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.63.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.63.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.63.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.63.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.64.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.64.down_proj.weight_scale": "model-00021-of-00092.safetensors", + 
"model.layers.20.mlp.experts.64.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.64.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.64.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.64.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.65.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.65.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.65.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.65.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.65.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.65.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.66.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.66.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.66.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.66.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.66.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.66.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.67.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.67.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.67.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.67.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.67.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.67.up_proj.weight_scale": 
"model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.68.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.68.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.68.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.68.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.68.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.68.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.69.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.69.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.69.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.69.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.69.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.69.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.7.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.7.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.7.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.7.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.7.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.7.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.70.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.70.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.70.gate_proj.weight": "model-00021-of-00092.safetensors", + 
"model.layers.20.mlp.experts.70.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.70.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.70.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.71.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.71.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.71.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.71.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.71.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.71.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.72.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.72.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.72.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.72.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.72.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.72.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.73.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.73.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.73.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.73.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.73.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.73.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.74.down_proj.weight": 
"model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.74.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.74.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.74.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.74.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.74.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.75.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.75.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.75.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.75.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.75.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.75.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.76.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.76.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.76.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.76.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.76.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.76.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.77.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.77.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.77.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.77.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + 
"model.layers.20.mlp.experts.77.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.77.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.78.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.78.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.78.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.78.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.78.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.78.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.79.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.79.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.79.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.79.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.79.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.79.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.8.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.8.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.8.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.8.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.8.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.8.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.80.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.80.down_proj.weight_scale": "model-00021-of-00092.safetensors", 
+ "model.layers.20.mlp.experts.80.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.80.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.80.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.80.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.81.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.81.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.81.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.81.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.81.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.81.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.82.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.82.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.82.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.82.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.82.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.82.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.83.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.83.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.83.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.83.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.83.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.83.up_proj.weight_scale": 
"model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.84.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.84.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.84.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.84.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.84.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.84.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.85.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.85.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.85.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.85.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.85.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.85.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.86.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.86.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.86.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.86.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.86.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.86.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.87.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.87.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.87.gate_proj.weight": "model-00021-of-00092.safetensors", + 
"model.layers.20.mlp.experts.87.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.87.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.87.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.88.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.88.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.88.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.88.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.88.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.88.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.89.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.89.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.89.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.89.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.89.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.89.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.9.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.9.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.9.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.9.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.9.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.9.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.90.down_proj.weight": "model-00021-of-00092.safetensors", 
+ "model.layers.20.mlp.experts.90.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.90.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.90.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.90.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.90.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.91.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.91.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.91.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.91.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.91.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.91.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.92.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.92.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.92.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.92.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.92.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.92.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.93.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.93.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.93.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.93.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.93.up_proj.weight": 
"model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.93.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.94.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.94.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.94.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.94.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.94.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.94.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.95.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.95.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.95.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.95.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.95.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.95.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.96.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.96.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.96.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.96.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.96.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.96.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.97.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.97.down_proj.weight_scale": "model-00021-of-00092.safetensors", + 
"model.layers.20.mlp.experts.97.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.97.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.97.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.97.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.98.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.98.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.98.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.98.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.98.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.98.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.99.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.99.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.99.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.99.gate_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.99.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.experts.99.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.gate.e_score_correction_bias": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.gate.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.shared_experts.down_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.shared_experts.down_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.shared_experts.gate_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.shared_experts.gate_proj.weight_scale": 
"model-00021-of-00092.safetensors", + "model.layers.20.mlp.shared_experts.up_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.mlp.shared_experts.up_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.post_attention_layernorm.weight": "model-00021-of-00092.safetensors", + "model.layers.20.self_attn.k_norm.weight": "model-00021-of-00092.safetensors", + "model.layers.20.self_attn.k_proj.bias": "model-00021-of-00092.safetensors", + "model.layers.20.self_attn.k_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.self_attn.k_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.self_attn.o_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.self_attn.o_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.self_attn.q_norm.weight": "model-00021-of-00092.safetensors", + "model.layers.20.self_attn.q_proj.bias": "model-00021-of-00092.safetensors", + "model.layers.20.self_attn.q_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.self_attn.q_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.20.self_attn.v_proj.bias": "model-00021-of-00092.safetensors", + "model.layers.20.self_attn.v_proj.weight": "model-00021-of-00092.safetensors", + "model.layers.20.self_attn.v_proj.weight_scale": "model-00021-of-00092.safetensors", + "model.layers.21.input_layernorm.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.0.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.0.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.0.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.0.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.0.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.0.up_proj.weight_scale": 
"model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.1.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.1.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.1.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.1.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.1.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.1.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.10.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.10.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.10.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.10.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.10.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.10.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.100.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.100.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.100.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.100.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.100.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.100.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.101.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.101.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.101.gate_proj.weight": "model-00022-of-00092.safetensors", + 
"model.layers.21.mlp.experts.101.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.101.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.101.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.102.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.102.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.102.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.102.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.102.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.102.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.103.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.103.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.103.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.103.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.103.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.103.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.104.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.104.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.104.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.104.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.104.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.104.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.105.down_proj.weight": 
"model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.105.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.105.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.105.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.105.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.105.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.106.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.106.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.106.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.106.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.106.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.106.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.107.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.107.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.107.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.107.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.107.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.107.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.108.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.108.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.108.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.108.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + 
"model.layers.21.mlp.experts.108.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.108.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.109.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.109.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.109.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.109.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.109.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.109.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.11.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.11.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.11.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.11.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.11.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.11.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.110.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.110.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.110.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.110.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.110.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.110.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.111.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.111.down_proj.weight_scale": 
"model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.111.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.111.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.111.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.111.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.112.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.112.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.112.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.112.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.112.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.112.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.113.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.113.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.113.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.113.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.113.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.113.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.114.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.114.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.114.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.114.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.114.up_proj.weight": "model-00022-of-00092.safetensors", + 
"model.layers.21.mlp.experts.114.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.115.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.115.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.115.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.115.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.115.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.115.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.116.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.116.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.116.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.116.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.116.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.116.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.117.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.117.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.117.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.117.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.117.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.117.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.118.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.118.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.118.gate_proj.weight": 
"model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.118.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.118.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.118.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.119.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.119.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.119.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.119.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.119.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.119.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.12.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.12.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.12.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.12.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.12.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.12.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.120.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.120.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.120.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.120.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.120.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.120.up_proj.weight_scale": "model-00022-of-00092.safetensors", + 
"model.layers.21.mlp.experts.121.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.121.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.121.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.121.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.121.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.121.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.122.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.122.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.122.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.122.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.122.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.122.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.123.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.123.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.123.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.123.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.123.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.123.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.124.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.124.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.124.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.124.gate_proj.weight_scale": 
"model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.124.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.124.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.125.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.125.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.125.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.125.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.125.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.125.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.126.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.126.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.126.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.126.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.126.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.126.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.127.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.127.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.127.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.127.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.127.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.127.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.128.down_proj.weight": "model-00022-of-00092.safetensors", + 
"model.layers.21.mlp.experts.128.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.128.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.128.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.128.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.128.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.129.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.129.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.129.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.129.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.129.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.129.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.13.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.13.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.13.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.13.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.13.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.13.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.130.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.130.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.130.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.130.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.130.up_proj.weight": 
"model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.130.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.131.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.131.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.131.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.131.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.131.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.131.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.132.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.132.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.132.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.132.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.132.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.132.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.133.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.133.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.133.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.133.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.133.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.133.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.134.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.134.down_proj.weight_scale": "model-00022-of-00092.safetensors", + 
"model.layers.21.mlp.experts.134.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.134.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.134.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.134.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.135.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.135.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.135.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.135.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.135.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.135.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.136.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.136.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.136.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.136.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.136.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.136.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.137.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.137.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.137.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.137.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.137.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.137.up_proj.weight_scale": 
"model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.138.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.138.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.138.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.138.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.138.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.138.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.139.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.139.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.139.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.139.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.139.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.139.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.14.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.14.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.14.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.14.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.14.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.14.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.140.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.140.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.140.gate_proj.weight": "model-00022-of-00092.safetensors", + 
"model.layers.21.mlp.experts.140.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.140.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.140.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.141.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.141.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.141.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.141.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.141.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.141.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.142.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.142.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.142.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.142.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.142.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.142.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.143.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.143.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.143.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.143.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.143.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.143.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.144.down_proj.weight": 
"model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.144.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.144.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.144.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.144.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.144.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.145.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.145.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.145.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.145.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.145.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.145.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.146.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.146.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.146.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.146.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.146.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.146.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.147.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.147.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.147.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.147.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + 
"model.layers.21.mlp.experts.147.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.147.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.148.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.148.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.148.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.148.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.148.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.148.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.149.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.149.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.149.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.149.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.149.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.149.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.15.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.15.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.15.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.15.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.15.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.15.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.150.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.150.down_proj.weight_scale": 
"model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.150.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.150.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.150.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.150.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.151.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.151.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.151.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.151.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.151.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.151.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.152.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.152.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.152.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.152.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.152.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.152.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.153.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.153.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.153.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.153.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.153.up_proj.weight": "model-00022-of-00092.safetensors", + 
"model.layers.21.mlp.experts.153.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.154.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.154.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.154.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.154.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.154.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.154.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.155.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.155.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.155.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.155.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.155.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.155.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.156.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.156.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.156.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.156.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.156.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.156.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.157.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.157.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.157.gate_proj.weight": 
"model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.157.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.157.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.157.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.158.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.158.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.158.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.158.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.158.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.158.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.159.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.159.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.159.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.159.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.159.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.159.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.16.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.16.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.16.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.16.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.16.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.16.up_proj.weight_scale": "model-00022-of-00092.safetensors", + 
"model.layers.21.mlp.experts.17.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.17.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.17.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.17.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.17.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.17.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.18.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.18.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.18.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.18.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.18.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.18.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.19.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.19.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.19.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.19.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.19.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.19.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.2.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.2.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.2.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.2.gate_proj.weight_scale": 
"model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.2.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.2.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.20.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.20.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.20.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.20.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.20.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.20.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.21.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.21.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.21.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.21.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.21.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.21.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.22.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.22.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.22.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.22.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.22.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.22.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.23.down_proj.weight": "model-00022-of-00092.safetensors", + 
"model.layers.21.mlp.experts.23.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.23.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.23.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.23.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.23.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.24.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.24.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.24.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.24.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.24.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.24.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.25.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.25.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.25.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.25.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.25.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.25.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.26.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.26.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.26.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.26.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.26.up_proj.weight": 
"model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.26.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.27.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.27.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.27.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.27.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.27.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.27.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.28.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.28.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.28.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.28.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.28.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.28.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.29.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.29.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.29.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.29.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.29.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.29.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.3.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.3.down_proj.weight_scale": "model-00022-of-00092.safetensors", + 
"model.layers.21.mlp.experts.3.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.3.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.3.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.3.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.30.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.30.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.30.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.30.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.30.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.30.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.31.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.31.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.31.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.31.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.31.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.31.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.32.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.32.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.32.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.32.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.32.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.32.up_proj.weight_scale": 
"model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.33.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.33.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.33.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.33.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.33.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.33.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.34.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.34.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.34.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.34.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.34.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.34.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.35.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.35.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.35.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.35.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.35.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.35.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.36.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.36.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.36.gate_proj.weight": "model-00022-of-00092.safetensors", + 
"model.layers.21.mlp.experts.36.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.36.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.36.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.37.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.37.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.37.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.37.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.37.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.37.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.38.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.38.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.38.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.38.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.38.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.38.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.39.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.39.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.39.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.39.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.39.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.39.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.4.down_proj.weight": 
"model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.4.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.4.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.4.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.4.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.4.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.40.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.40.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.40.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.40.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.40.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.40.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.41.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.41.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.41.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.41.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.41.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.41.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.42.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.42.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.42.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.42.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + 
"model.layers.21.mlp.experts.42.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.42.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.43.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.43.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.43.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.43.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.43.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.43.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.44.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.44.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.44.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.44.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.44.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.44.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.45.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.45.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.45.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.45.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.45.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.45.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.46.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.46.down_proj.weight_scale": 
"model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.46.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.46.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.46.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.46.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.47.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.47.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.47.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.47.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.47.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.47.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.48.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.48.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.48.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.48.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.48.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.48.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.49.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.49.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.49.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.49.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.49.up_proj.weight": "model-00022-of-00092.safetensors", + 
"model.layers.21.mlp.experts.49.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.5.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.5.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.5.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.5.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.5.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.5.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.50.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.50.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.50.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.50.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.50.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.50.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.51.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.51.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.51.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.51.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.51.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.51.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.52.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.52.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.52.gate_proj.weight": 
"model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.52.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.52.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.52.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.53.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.53.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.53.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.53.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.53.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.53.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.54.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.54.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.54.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.54.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.54.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.54.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.55.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.55.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.55.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.55.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.55.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.55.up_proj.weight_scale": "model-00022-of-00092.safetensors", + 
"model.layers.21.mlp.experts.56.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.56.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.56.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.56.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.56.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.56.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.57.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.57.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.57.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.57.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.57.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.57.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.58.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.58.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.58.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.58.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.58.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.58.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.59.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.59.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.59.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.59.gate_proj.weight_scale": 
"model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.59.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.59.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.6.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.6.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.6.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.6.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.6.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.6.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.60.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.60.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.60.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.60.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.60.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.60.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.61.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.61.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.61.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.61.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.61.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.61.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.62.down_proj.weight": "model-00022-of-00092.safetensors", + 
"model.layers.21.mlp.experts.62.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.62.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.62.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.62.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.62.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.63.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.63.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.63.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.63.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.63.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.63.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.64.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.64.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.64.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.64.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.64.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.64.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.65.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.65.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.65.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.65.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.65.up_proj.weight": 
"model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.65.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.66.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.66.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.66.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.66.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.66.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.66.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.67.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.67.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.67.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.67.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.67.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.67.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.68.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.68.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.68.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.68.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.68.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.68.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.69.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.69.down_proj.weight_scale": "model-00022-of-00092.safetensors", + 
"model.layers.21.mlp.experts.69.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.69.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.69.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.69.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.7.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.7.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.7.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.7.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.7.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.7.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.70.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.70.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.70.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.70.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.70.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.70.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.71.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.71.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.71.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.71.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.71.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.71.up_proj.weight_scale": "model-00022-of-00092.safetensors", 
+ "model.layers.21.mlp.experts.72.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.72.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.72.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.72.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.72.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.72.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.73.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.73.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.73.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.73.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.73.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.73.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.74.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.74.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.74.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.74.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.74.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.74.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.75.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.75.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.75.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.75.gate_proj.weight_scale": 
"model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.75.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.75.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.76.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.76.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.76.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.76.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.76.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.76.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.77.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.77.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.77.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.77.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.77.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.77.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.78.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.78.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.78.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.78.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.78.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.78.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.79.down_proj.weight": "model-00022-of-00092.safetensors", + 
"model.layers.21.mlp.experts.79.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.79.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.79.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.79.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.79.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.8.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.8.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.8.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.8.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.8.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.8.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.80.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.80.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.80.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.80.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.80.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.80.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.81.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.81.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.81.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.81.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.81.up_proj.weight": 
"model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.81.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.82.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.82.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.82.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.82.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.82.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.82.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.83.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.83.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.83.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.83.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.83.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.83.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.84.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.84.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.84.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.84.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.84.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.84.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.85.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.85.down_proj.weight_scale": "model-00022-of-00092.safetensors", + 
"model.layers.21.mlp.experts.85.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.85.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.85.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.85.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.86.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.86.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.86.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.86.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.86.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.86.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.87.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.87.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.87.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.87.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.87.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.87.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.88.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.88.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.88.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.88.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.88.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.88.up_proj.weight_scale": 
"model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.89.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.89.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.89.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.89.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.89.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.89.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.9.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.9.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.9.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.9.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.9.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.9.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.90.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.90.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.90.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.90.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.90.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.90.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.91.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.91.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.91.gate_proj.weight": "model-00022-of-00092.safetensors", + 
"model.layers.21.mlp.experts.91.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.91.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.91.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.92.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.92.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.92.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.92.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.92.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.92.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.93.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.93.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.93.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.93.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.93.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.93.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.94.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.94.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.94.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.94.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.94.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.94.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.95.down_proj.weight": 
"model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.95.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.95.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.95.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.95.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.95.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.96.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.96.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.96.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.96.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.96.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.96.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.97.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.97.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.97.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.97.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.97.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.97.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.98.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.98.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.98.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.98.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + 
"model.layers.21.mlp.experts.98.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.98.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.99.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.99.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.99.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.99.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.99.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.experts.99.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.gate.e_score_correction_bias": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.gate.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.shared_experts.down_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.shared_experts.down_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.shared_experts.gate_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.shared_experts.gate_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.shared_experts.up_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.mlp.shared_experts.up_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.post_attention_layernorm.weight": "model-00022-of-00092.safetensors", + "model.layers.21.self_attn.k_norm.weight": "model-00022-of-00092.safetensors", + "model.layers.21.self_attn.k_proj.bias": "model-00022-of-00092.safetensors", + "model.layers.21.self_attn.k_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.self_attn.k_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.self_attn.o_proj.weight": "model-00022-of-00092.safetensors", + 
"model.layers.21.self_attn.o_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.self_attn.q_norm.weight": "model-00022-of-00092.safetensors", + "model.layers.21.self_attn.q_proj.bias": "model-00022-of-00092.safetensors", + "model.layers.21.self_attn.q_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.self_attn.q_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.21.self_attn.v_proj.bias": "model-00022-of-00092.safetensors", + "model.layers.21.self_attn.v_proj.weight": "model-00022-of-00092.safetensors", + "model.layers.21.self_attn.v_proj.weight_scale": "model-00022-of-00092.safetensors", + "model.layers.22.input_layernorm.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.0.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.0.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.0.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.0.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.0.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.0.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.1.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.1.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.1.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.1.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.1.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.1.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.10.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.10.down_proj.weight_scale": 
"model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.10.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.10.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.10.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.10.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.100.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.100.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.100.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.100.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.100.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.100.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.101.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.101.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.101.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.101.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.101.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.101.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.102.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.102.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.102.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.102.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.102.up_proj.weight": "model-00023-of-00092.safetensors", + 
"model.layers.22.mlp.experts.102.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.103.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.103.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.103.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.103.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.103.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.103.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.104.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.104.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.104.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.104.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.104.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.104.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.105.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.105.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.105.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.105.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.105.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.105.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.106.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.106.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.106.gate_proj.weight": 
"model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.106.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.106.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.106.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.107.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.107.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.107.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.107.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.107.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.107.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.108.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.108.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.108.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.108.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.108.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.108.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.109.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.109.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.109.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.109.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.109.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.109.up_proj.weight_scale": "model-00023-of-00092.safetensors", + 
"model.layers.22.mlp.experts.11.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.11.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.11.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.11.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.11.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.11.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.110.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.110.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.110.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.110.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.110.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.110.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.111.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.111.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.111.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.111.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.111.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.111.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.112.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.112.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.112.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.112.gate_proj.weight_scale": 
"model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.112.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.112.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.113.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.113.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.113.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.113.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.113.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.113.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.114.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.114.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.114.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.114.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.114.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.114.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.115.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.115.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.115.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.115.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.115.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.115.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.116.down_proj.weight": "model-00023-of-00092.safetensors", + 
"model.layers.22.mlp.experts.116.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.116.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.116.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.116.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.116.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.117.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.117.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.117.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.117.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.117.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.117.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.118.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.118.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.118.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.118.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.118.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.118.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.119.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.119.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.119.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.119.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.119.up_proj.weight": 
"model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.119.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.12.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.12.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.12.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.12.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.12.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.12.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.120.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.120.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.120.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.120.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.120.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.120.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.121.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.121.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.121.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.121.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.121.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.121.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.122.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.122.down_proj.weight_scale": "model-00023-of-00092.safetensors", + 
"model.layers.22.mlp.experts.122.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.122.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.122.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.122.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.123.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.123.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.123.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.123.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.123.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.123.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.124.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.124.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.124.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.124.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.124.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.124.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.125.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.125.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.125.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.125.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.125.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.125.up_proj.weight_scale": 
"model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.126.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.126.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.126.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.126.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.126.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.126.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.127.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.127.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.127.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.127.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.127.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.127.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.128.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.128.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.128.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.128.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.128.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.128.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.129.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.129.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.129.gate_proj.weight": "model-00023-of-00092.safetensors", + 
"model.layers.22.mlp.experts.129.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.129.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.129.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.13.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.13.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.13.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.13.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.13.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.13.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.130.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.130.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.130.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.130.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.130.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.130.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.131.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.131.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.131.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.131.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.131.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.131.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.132.down_proj.weight": 
"model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.132.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.132.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.132.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.132.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.132.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.133.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.133.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.133.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.133.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.133.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.133.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.134.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.134.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.134.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.134.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.134.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.134.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.135.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.135.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.135.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.135.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + 
"model.layers.22.mlp.experts.135.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.135.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.136.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.136.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.136.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.136.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.136.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.136.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.137.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.137.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.137.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.137.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.137.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.137.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.138.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.138.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.138.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.138.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.138.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.138.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.139.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.139.down_proj.weight_scale": 
"model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.139.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.139.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.139.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.139.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.14.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.14.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.14.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.14.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.14.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.14.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.140.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.140.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.140.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.140.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.140.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.140.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.141.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.141.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.141.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.141.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.141.up_proj.weight": "model-00023-of-00092.safetensors", + 
"model.layers.22.mlp.experts.141.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.142.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.142.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.142.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.142.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.142.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.142.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.143.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.143.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.143.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.143.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.143.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.143.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.144.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.144.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.144.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.144.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.144.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.144.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.145.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.145.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.145.gate_proj.weight": 
"model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.145.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.145.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.145.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.146.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.146.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.146.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.146.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.146.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.146.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.147.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.147.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.147.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.147.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.147.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.147.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.148.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.148.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.148.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.148.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.148.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.148.up_proj.weight_scale": "model-00023-of-00092.safetensors", + 
"model.layers.22.mlp.experts.149.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.149.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.149.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.149.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.149.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.149.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.15.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.15.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.15.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.15.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.15.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.15.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.150.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.150.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.150.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.150.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.150.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.150.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.151.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.151.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.151.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.151.gate_proj.weight_scale": 
"model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.151.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.151.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.152.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.152.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.152.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.152.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.152.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.152.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.153.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.153.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.153.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.153.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.153.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.153.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.154.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.154.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.154.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.154.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.154.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.154.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.155.down_proj.weight": "model-00023-of-00092.safetensors", + 
"model.layers.22.mlp.experts.155.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.155.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.155.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.155.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.155.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.156.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.156.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.156.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.156.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.156.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.156.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.157.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.157.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.157.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.157.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.157.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.157.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.158.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.158.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.158.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.158.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.158.up_proj.weight": 
"model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.158.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.159.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.159.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.159.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.159.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.159.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.159.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.16.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.16.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.16.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.16.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.16.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.16.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.17.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.17.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.17.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.17.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.17.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.17.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.18.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.18.down_proj.weight_scale": "model-00023-of-00092.safetensors", + 
"model.layers.22.mlp.experts.18.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.18.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.18.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.18.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.19.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.19.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.19.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.19.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.19.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.19.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.2.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.2.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.2.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.2.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.2.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.2.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.20.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.20.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.20.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.20.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.20.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.20.up_proj.weight_scale": "model-00023-of-00092.safetensors", 
+ "model.layers.22.mlp.experts.21.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.21.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.21.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.21.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.21.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.21.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.22.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.22.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.22.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.22.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.22.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.22.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.23.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.23.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.23.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.23.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.23.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.23.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.24.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.24.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.24.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.24.gate_proj.weight_scale": 
"model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.24.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.24.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.25.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.25.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.25.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.25.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.25.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.25.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.26.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.26.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.26.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.26.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.26.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.26.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.27.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.27.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.27.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.27.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.27.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.27.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.28.down_proj.weight": "model-00023-of-00092.safetensors", + 
"model.layers.22.mlp.experts.28.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.28.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.28.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.28.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.28.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.29.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.29.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.29.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.29.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.29.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.29.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.3.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.3.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.3.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.3.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.3.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.3.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.30.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.30.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.30.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.30.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.30.up_proj.weight": 
"model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.30.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.31.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.31.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.31.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.31.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.31.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.31.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.32.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.32.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.32.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.32.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.32.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.32.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.33.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.33.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.33.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.33.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.33.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.33.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.34.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.34.down_proj.weight_scale": "model-00023-of-00092.safetensors", + 
"model.layers.22.mlp.experts.34.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.34.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.34.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.34.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.35.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.35.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.35.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.35.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.35.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.35.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.36.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.36.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.36.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.36.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.36.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.36.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.37.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.37.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.37.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.37.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.37.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.37.up_proj.weight_scale": 
"model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.38.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.38.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.38.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.38.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.38.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.38.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.39.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.39.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.39.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.39.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.39.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.39.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.4.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.4.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.4.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.4.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.4.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.4.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.40.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.40.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.40.gate_proj.weight": "model-00023-of-00092.safetensors", + 
"model.layers.22.mlp.experts.40.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.40.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.40.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.41.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.41.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.41.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.41.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.41.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.41.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.42.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.42.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.42.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.42.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.42.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.42.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.43.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.43.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.43.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.43.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.43.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.43.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.44.down_proj.weight": 
"model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.44.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.44.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.44.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.44.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.44.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.45.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.45.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.45.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.45.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.45.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.45.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.46.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.46.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.46.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.46.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.46.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.46.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.47.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.47.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.47.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.47.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + 
"model.layers.22.mlp.experts.47.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.47.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.48.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.48.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.48.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.48.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.48.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.48.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.49.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.49.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.49.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.49.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.49.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.49.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.5.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.5.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.5.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.5.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.5.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.5.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.50.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.50.down_proj.weight_scale": "model-00023-of-00092.safetensors", 
+ "model.layers.22.mlp.experts.50.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.50.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.50.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.50.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.51.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.51.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.51.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.51.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.51.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.51.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.52.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.52.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.52.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.52.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.52.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.52.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.53.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.53.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.53.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.53.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.53.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.53.up_proj.weight_scale": 
"model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.54.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.54.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.54.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.54.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.54.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.54.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.55.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.55.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.55.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.55.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.55.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.55.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.56.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.56.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.56.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.56.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.56.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.56.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.57.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.57.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.57.gate_proj.weight": "model-00023-of-00092.safetensors", + 
"model.layers.22.mlp.experts.57.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.57.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.57.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.58.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.58.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.58.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.58.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.58.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.58.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.59.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.59.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.59.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.59.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.59.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.59.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.6.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.6.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.6.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.6.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.6.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.6.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.60.down_proj.weight": "model-00023-of-00092.safetensors", 
+ "model.layers.22.mlp.experts.60.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.60.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.60.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.60.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.60.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.61.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.61.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.61.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.61.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.61.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.61.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.62.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.62.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.62.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.62.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.62.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.62.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.63.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.63.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.63.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.63.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.63.up_proj.weight": 
"model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.63.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.64.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.64.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.64.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.64.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.64.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.64.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.65.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.65.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.65.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.65.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.65.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.65.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.66.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.66.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.66.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.66.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.66.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.66.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.67.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.67.down_proj.weight_scale": "model-00023-of-00092.safetensors", + 
"model.layers.22.mlp.experts.67.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.67.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.67.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.67.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.68.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.68.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.68.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.68.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.68.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.68.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.69.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.69.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.69.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.69.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.69.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.69.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.7.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.7.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.7.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.7.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.7.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.7.up_proj.weight_scale": "model-00023-of-00092.safetensors", 
+ "model.layers.22.mlp.experts.70.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.70.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.70.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.70.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.70.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.70.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.71.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.71.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.71.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.71.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.71.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.71.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.72.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.72.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.72.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.72.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.72.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.72.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.73.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.73.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.73.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.73.gate_proj.weight_scale": 
"model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.73.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.73.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.74.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.74.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.74.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.74.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.74.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.74.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.75.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.75.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.75.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.75.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.75.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.75.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.76.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.76.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.76.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.76.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.76.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.76.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.77.down_proj.weight": "model-00023-of-00092.safetensors", + 
"model.layers.22.mlp.experts.77.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.77.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.77.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.77.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.77.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.78.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.78.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.78.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.78.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.78.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.78.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.79.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.79.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.79.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.79.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.79.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.79.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.8.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.8.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.8.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.8.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.8.up_proj.weight": 
"model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.8.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.80.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.80.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.80.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.80.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.80.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.80.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.81.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.81.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.81.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.81.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.81.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.81.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.82.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.82.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.82.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.82.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.82.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.82.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.83.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.83.down_proj.weight_scale": "model-00023-of-00092.safetensors", + 
"model.layers.22.mlp.experts.83.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.83.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.83.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.83.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.84.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.84.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.84.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.84.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.84.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.84.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.85.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.85.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.85.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.85.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.85.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.85.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.86.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.86.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.86.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.86.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.86.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.86.up_proj.weight_scale": 
"model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.87.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.87.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.87.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.87.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.87.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.87.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.88.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.88.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.88.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.88.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.88.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.88.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.89.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.89.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.89.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.89.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.89.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.89.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.9.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.9.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.9.gate_proj.weight": "model-00023-of-00092.safetensors", + 
"model.layers.22.mlp.experts.9.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.9.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.9.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.90.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.90.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.90.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.90.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.90.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.90.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.91.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.91.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.91.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.91.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.91.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.91.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.92.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.92.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.92.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.92.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.92.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.92.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.93.down_proj.weight": 
"model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.93.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.93.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.93.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.93.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.93.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.94.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.94.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.94.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.94.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.94.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.94.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.95.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.95.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.95.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.95.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.95.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.95.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.96.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.96.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.96.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.96.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + 
"model.layers.22.mlp.experts.96.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.96.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.97.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.97.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.97.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.97.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.97.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.97.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.98.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.98.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.98.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.98.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.98.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.98.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.99.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.99.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.99.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.99.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.99.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.experts.99.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.gate.e_score_correction_bias": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.gate.weight": "model-00023-of-00092.safetensors", + 
"model.layers.22.mlp.shared_experts.down_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.shared_experts.down_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.shared_experts.gate_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.shared_experts.gate_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.shared_experts.up_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.mlp.shared_experts.up_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.post_attention_layernorm.weight": "model-00023-of-00092.safetensors", + "model.layers.22.self_attn.k_norm.weight": "model-00023-of-00092.safetensors", + "model.layers.22.self_attn.k_proj.bias": "model-00023-of-00092.safetensors", + "model.layers.22.self_attn.k_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.self_attn.k_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.self_attn.o_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.self_attn.o_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.self_attn.q_norm.weight": "model-00023-of-00092.safetensors", + "model.layers.22.self_attn.q_proj.bias": "model-00023-of-00092.safetensors", + "model.layers.22.self_attn.q_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.self_attn.q_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.22.self_attn.v_proj.bias": "model-00023-of-00092.safetensors", + "model.layers.22.self_attn.v_proj.weight": "model-00023-of-00092.safetensors", + "model.layers.22.self_attn.v_proj.weight_scale": "model-00023-of-00092.safetensors", + "model.layers.23.input_layernorm.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.0.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.0.down_proj.weight_scale": "model-00024-of-00092.safetensors", + 
"model.layers.23.mlp.experts.0.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.0.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.0.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.0.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.1.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.1.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.1.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.1.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.1.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.1.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.10.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.10.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.10.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.10.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.10.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.10.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.100.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.100.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.100.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.100.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.100.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.100.up_proj.weight_scale": 
"model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.101.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.101.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.101.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.101.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.101.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.101.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.102.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.102.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.102.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.102.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.102.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.102.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.103.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.103.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.103.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.103.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.103.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.103.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.104.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.104.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.104.gate_proj.weight": "model-00024-of-00092.safetensors", + 
"model.layers.23.mlp.experts.104.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.104.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.104.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.105.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.105.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.105.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.105.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.105.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.105.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.106.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.106.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.106.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.106.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.106.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.106.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.107.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.107.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.107.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.107.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.107.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.107.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.108.down_proj.weight": 
"model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.108.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.108.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.108.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.108.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.108.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.109.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.109.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.109.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.109.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.109.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.109.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.11.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.11.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.11.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.11.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.11.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.11.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.110.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.110.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.110.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.110.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + 
"model.layers.23.mlp.experts.110.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.110.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.111.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.111.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.111.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.111.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.111.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.111.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.112.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.112.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.112.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.112.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.112.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.112.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.113.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.113.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.113.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.113.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.113.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.113.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.114.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.114.down_proj.weight_scale": 
"model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.114.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.114.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.114.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.114.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.115.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.115.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.115.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.115.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.115.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.115.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.116.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.116.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.116.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.116.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.116.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.116.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.117.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.117.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.117.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.117.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.117.up_proj.weight": "model-00024-of-00092.safetensors", + 
"model.layers.23.mlp.experts.117.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.118.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.118.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.118.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.118.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.118.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.118.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.119.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.119.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.119.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.119.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.119.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.119.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.12.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.12.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.12.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.12.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.12.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.12.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.120.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.120.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.120.gate_proj.weight": 
"model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.120.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.120.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.120.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.121.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.121.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.121.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.121.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.121.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.121.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.122.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.122.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.122.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.122.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.122.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.122.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.123.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.123.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.123.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.123.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.123.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.123.up_proj.weight_scale": "model-00024-of-00092.safetensors", + 
"model.layers.23.mlp.experts.124.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.124.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.124.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.124.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.124.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.124.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.125.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.125.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.125.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.125.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.125.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.125.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.126.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.126.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.126.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.126.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.126.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.126.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.127.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.127.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.127.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.127.gate_proj.weight_scale": 
"model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.127.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.127.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.128.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.128.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.128.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.128.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.128.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.128.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.129.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.129.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.129.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.129.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.129.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.129.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.13.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.13.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.13.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.13.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.13.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.13.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.130.down_proj.weight": "model-00024-of-00092.safetensors", + 
"model.layers.23.mlp.experts.130.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.130.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.130.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.130.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.130.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.131.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.131.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.131.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.131.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.131.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.131.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.132.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.132.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.132.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.132.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.132.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.132.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.133.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.133.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.133.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.133.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.133.up_proj.weight": 
"model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.133.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.134.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.134.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.134.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.134.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.134.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.134.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.135.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.135.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.135.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.135.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.135.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.135.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.136.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.136.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.136.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.136.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.136.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.136.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.137.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.137.down_proj.weight_scale": "model-00024-of-00092.safetensors", + 
"model.layers.23.mlp.experts.137.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.137.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.137.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.137.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.138.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.138.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.138.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.138.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.138.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.138.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.139.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.139.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.139.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.139.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.139.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.139.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.14.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.14.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.14.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.14.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.14.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.14.up_proj.weight_scale": 
"model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.140.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.140.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.140.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.140.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.140.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.140.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.141.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.141.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.141.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.141.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.141.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.141.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.142.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.142.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.142.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.142.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.142.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.142.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.143.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.143.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.143.gate_proj.weight": "model-00024-of-00092.safetensors", + 
"model.layers.23.mlp.experts.143.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.143.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.143.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.144.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.144.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.144.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.144.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.144.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.144.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.145.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.145.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.145.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.145.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.145.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.145.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.146.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.146.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.146.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.146.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.146.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.146.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.147.down_proj.weight": 
"model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.147.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.147.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.147.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.147.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.147.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.148.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.148.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.148.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.148.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.148.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.148.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.149.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.149.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.149.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.149.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.149.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.149.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.15.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.15.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.15.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.15.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + 
"model.layers.23.mlp.experts.15.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.15.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.150.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.150.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.150.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.150.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.150.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.150.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.151.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.151.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.151.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.151.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.151.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.151.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.152.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.152.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.152.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.152.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.152.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.152.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.153.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.153.down_proj.weight_scale": 
"model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.153.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.153.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.153.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.153.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.154.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.154.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.154.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.154.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.154.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.154.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.155.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.155.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.155.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.155.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.155.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.155.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.156.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.156.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.156.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.156.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.156.up_proj.weight": "model-00024-of-00092.safetensors", + 
"model.layers.23.mlp.experts.156.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.157.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.157.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.157.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.157.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.157.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.157.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.158.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.158.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.158.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.158.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.158.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.158.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.159.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.159.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.159.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.159.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.159.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.159.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.16.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.16.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.16.gate_proj.weight": 
"model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.16.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.16.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.16.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.17.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.17.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.17.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.17.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.17.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.17.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.18.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.18.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.18.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.18.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.18.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.18.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.19.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.19.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.19.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.19.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.19.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.19.up_proj.weight_scale": "model-00024-of-00092.safetensors", + 
"model.layers.23.mlp.experts.2.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.2.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.2.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.2.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.2.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.2.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.20.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.20.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.20.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.20.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.20.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.20.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.21.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.21.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.21.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.21.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.21.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.21.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.22.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.22.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.22.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.22.gate_proj.weight_scale": 
"model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.22.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.22.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.23.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.23.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.23.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.23.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.23.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.23.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.24.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.24.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.24.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.24.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.24.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.24.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.25.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.25.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.25.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.25.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.25.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.25.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.26.down_proj.weight": "model-00024-of-00092.safetensors", + 
"model.layers.23.mlp.experts.26.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.26.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.26.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.26.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.26.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.27.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.27.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.27.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.27.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.27.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.27.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.28.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.28.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.28.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.28.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.28.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.28.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.29.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.29.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.29.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.29.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.29.up_proj.weight": 
"model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.29.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.3.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.3.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.3.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.3.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.3.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.3.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.30.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.30.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.30.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.30.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.30.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.30.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.31.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.31.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.31.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.31.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.31.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.31.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.32.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.32.down_proj.weight_scale": "model-00024-of-00092.safetensors", + 
"model.layers.23.mlp.experts.32.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.32.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.32.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.32.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.33.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.33.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.33.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.33.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.33.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.33.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.34.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.34.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.34.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.34.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.34.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.34.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.35.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.35.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.35.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.35.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.35.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.35.up_proj.weight_scale": 
"model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.36.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.36.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.36.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.36.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.36.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.36.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.37.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.37.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.37.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.37.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.37.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.37.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.38.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.38.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.38.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.38.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.38.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.38.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.39.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.39.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.39.gate_proj.weight": "model-00024-of-00092.safetensors", + 
"model.layers.23.mlp.experts.39.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.39.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.39.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.4.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.4.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.4.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.4.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.4.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.4.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.40.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.40.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.40.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.40.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.40.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.40.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.41.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.41.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.41.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.41.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.41.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.41.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.42.down_proj.weight": "model-00024-of-00092.safetensors", 
+ "model.layers.23.mlp.experts.42.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.42.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.42.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.42.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.42.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.43.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.43.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.43.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.43.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.43.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.43.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.44.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.44.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.44.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.44.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.44.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.44.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.45.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.45.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.45.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.45.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.45.up_proj.weight": 
"model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.45.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.46.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.46.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.46.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.46.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.46.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.46.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.47.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.47.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.47.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.47.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.47.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.47.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.48.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.48.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.48.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.48.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.48.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.48.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.49.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.49.down_proj.weight_scale": "model-00024-of-00092.safetensors", + 
"model.layers.23.mlp.experts.49.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.49.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.49.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.49.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.5.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.5.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.5.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.5.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.5.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.5.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.50.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.50.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.50.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.50.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.50.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.50.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.51.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.51.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.51.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.51.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.51.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.51.up_proj.weight_scale": "model-00024-of-00092.safetensors", 
+ "model.layers.23.mlp.experts.52.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.52.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.52.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.52.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.52.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.52.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.53.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.53.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.53.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.53.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.53.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.53.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.54.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.54.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.54.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.54.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.54.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.54.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.55.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.55.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.55.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.55.gate_proj.weight_scale": 
"model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.55.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.55.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.56.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.56.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.56.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.56.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.56.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.56.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.57.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.57.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.57.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.57.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.57.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.57.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.58.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.58.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.58.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.58.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.58.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.58.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.59.down_proj.weight": "model-00024-of-00092.safetensors", + 
"model.layers.23.mlp.experts.59.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.59.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.59.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.59.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.59.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.6.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.6.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.6.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.6.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.6.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.6.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.60.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.60.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.60.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.60.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.60.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.60.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.61.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.61.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.61.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.61.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.61.up_proj.weight": 
"model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.61.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.62.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.62.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.62.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.62.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.62.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.62.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.63.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.63.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.63.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.63.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.63.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.63.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.64.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.64.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.64.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.64.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.64.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.64.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.65.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.65.down_proj.weight_scale": "model-00024-of-00092.safetensors", + 
"model.layers.23.mlp.experts.65.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.65.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.65.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.65.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.66.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.66.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.66.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.66.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.66.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.66.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.67.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.67.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.67.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.67.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.67.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.67.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.68.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.68.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.68.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.68.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.68.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.68.up_proj.weight_scale": 
"model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.69.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.69.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.69.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.69.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.69.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.69.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.7.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.7.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.7.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.7.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.7.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.7.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.70.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.70.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.70.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.70.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.70.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.70.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.71.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.71.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.71.gate_proj.weight": "model-00024-of-00092.safetensors", + 
"model.layers.23.mlp.experts.71.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.71.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.71.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.72.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.72.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.72.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.72.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.72.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.72.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.73.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.73.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.73.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.73.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.73.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.73.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.74.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.74.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.74.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.74.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.74.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.74.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.75.down_proj.weight": 
"model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.75.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.75.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.75.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.75.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.75.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.76.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.76.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.76.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.76.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.76.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.76.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.77.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.77.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.77.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.77.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.77.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.77.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.78.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.78.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.78.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.78.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + 
"model.layers.23.mlp.experts.78.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.78.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.79.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.79.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.79.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.79.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.79.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.79.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.8.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.8.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.8.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.8.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.8.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.8.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.80.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.80.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.80.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.80.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.80.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.80.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.81.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.81.down_proj.weight_scale": "model-00024-of-00092.safetensors", 
+ "model.layers.23.mlp.experts.81.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.81.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.81.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.81.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.82.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.82.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.82.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.82.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.82.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.82.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.83.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.83.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.83.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.83.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.83.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.83.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.84.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.84.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.84.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.84.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.84.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.84.up_proj.weight_scale": 
"model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.85.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.85.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.85.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.85.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.85.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.85.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.86.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.86.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.86.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.86.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.86.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.86.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.87.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.87.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.87.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.87.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.87.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.87.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.88.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.88.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.88.gate_proj.weight": "model-00024-of-00092.safetensors", + 
"model.layers.23.mlp.experts.88.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.88.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.88.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.89.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.89.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.89.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.89.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.89.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.89.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.9.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.9.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.9.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.9.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.9.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.9.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.90.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.90.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.90.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.90.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.90.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.90.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.91.down_proj.weight": "model-00024-of-00092.safetensors", 
+ "model.layers.23.mlp.experts.91.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.91.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.91.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.91.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.91.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.92.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.92.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.92.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.92.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.92.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.92.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.93.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.93.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.93.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.93.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.93.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.93.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.94.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.94.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.94.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.94.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.94.up_proj.weight": 
"model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.94.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.95.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.95.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.95.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.95.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.95.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.95.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.96.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.96.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.96.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.96.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.96.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.96.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.97.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.97.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.97.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.97.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.97.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.97.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.98.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.98.down_proj.weight_scale": "model-00024-of-00092.safetensors", + 
"model.layers.23.mlp.experts.98.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.98.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.98.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.98.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.99.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.99.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.99.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.99.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.99.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.experts.99.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.gate.e_score_correction_bias": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.gate.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.shared_experts.down_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.shared_experts.down_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.shared_experts.gate_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.shared_experts.gate_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.shared_experts.up_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.mlp.shared_experts.up_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.post_attention_layernorm.weight": "model-00024-of-00092.safetensors", + "model.layers.23.self_attn.k_norm.weight": "model-00024-of-00092.safetensors", + "model.layers.23.self_attn.k_proj.bias": "model-00024-of-00092.safetensors", + "model.layers.23.self_attn.k_proj.weight": "model-00024-of-00092.safetensors", + 
"model.layers.23.self_attn.k_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.self_attn.o_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.self_attn.o_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.self_attn.q_norm.weight": "model-00024-of-00092.safetensors", + "model.layers.23.self_attn.q_proj.bias": "model-00024-of-00092.safetensors", + "model.layers.23.self_attn.q_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.self_attn.q_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.23.self_attn.v_proj.bias": "model-00024-of-00092.safetensors", + "model.layers.23.self_attn.v_proj.weight": "model-00024-of-00092.safetensors", + "model.layers.23.self_attn.v_proj.weight_scale": "model-00024-of-00092.safetensors", + "model.layers.24.input_layernorm.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.0.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.0.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.0.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.0.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.0.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.0.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.1.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.1.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.1.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.1.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.1.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.1.up_proj.weight_scale": "model-00025-of-00092.safetensors", + 
"model.layers.24.mlp.experts.10.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.10.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.10.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.10.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.10.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.10.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.100.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.100.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.100.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.100.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.100.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.100.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.101.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.101.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.101.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.101.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.101.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.101.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.102.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.102.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.102.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.102.gate_proj.weight_scale": 
"model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.102.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.102.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.103.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.103.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.103.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.103.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.103.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.103.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.104.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.104.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.104.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.104.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.104.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.104.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.105.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.105.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.105.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.105.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.105.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.105.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.106.down_proj.weight": "model-00025-of-00092.safetensors", + 
"model.layers.24.mlp.experts.106.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.106.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.106.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.106.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.106.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.107.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.107.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.107.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.107.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.107.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.107.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.108.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.108.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.108.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.108.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.108.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.108.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.109.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.109.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.109.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.109.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.109.up_proj.weight": 
"model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.109.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.11.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.11.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.11.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.11.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.11.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.11.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.110.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.110.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.110.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.110.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.110.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.110.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.111.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.111.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.111.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.111.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.111.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.111.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.112.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.112.down_proj.weight_scale": "model-00025-of-00092.safetensors", + 
"model.layers.24.mlp.experts.112.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.112.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.112.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.112.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.113.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.113.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.113.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.113.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.113.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.113.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.114.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.114.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.114.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.114.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.114.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.114.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.115.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.115.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.115.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.115.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.115.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.115.up_proj.weight_scale": 
"model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.116.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.116.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.116.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.116.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.116.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.116.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.117.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.117.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.117.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.117.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.117.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.117.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.118.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.118.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.118.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.118.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.118.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.118.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.119.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.119.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.119.gate_proj.weight": "model-00025-of-00092.safetensors", + 
"model.layers.24.mlp.experts.119.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.119.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.119.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.12.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.12.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.12.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.12.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.12.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.12.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.120.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.120.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.120.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.120.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.120.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.120.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.121.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.121.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.121.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.121.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.121.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.121.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.122.down_proj.weight": 
"model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.122.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.122.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.122.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.122.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.122.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.123.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.123.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.123.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.123.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.123.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.123.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.124.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.124.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.124.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.124.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.124.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.124.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.125.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.125.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.125.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.125.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + 
"model.layers.24.mlp.experts.125.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.125.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.126.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.126.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.126.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.126.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.126.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.126.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.127.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.127.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.127.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.127.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.127.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.127.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.128.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.128.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.128.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.128.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.128.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.128.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.129.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.129.down_proj.weight_scale": 
"model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.129.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.129.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.129.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.129.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.13.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.13.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.13.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.13.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.13.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.13.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.130.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.130.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.130.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.130.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.130.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.130.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.131.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.131.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.131.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.131.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.131.up_proj.weight": "model-00025-of-00092.safetensors", + 
"model.layers.24.mlp.experts.131.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.132.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.132.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.132.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.132.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.132.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.132.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.133.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.133.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.133.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.133.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.133.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.133.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.134.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.134.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.134.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.134.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.134.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.134.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.135.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.135.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.135.gate_proj.weight": 
"model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.135.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.135.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.135.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.136.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.136.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.136.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.136.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.136.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.136.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.137.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.137.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.137.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.137.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.137.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.137.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.138.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.138.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.138.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.138.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.138.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.138.up_proj.weight_scale": "model-00025-of-00092.safetensors", + 
"model.layers.24.mlp.experts.139.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.139.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.139.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.139.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.139.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.139.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.14.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.14.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.14.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.14.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.14.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.14.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.140.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.140.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.140.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.140.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.140.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.140.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.141.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.141.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.141.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.141.gate_proj.weight_scale": 
"model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.141.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.141.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.142.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.142.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.142.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.142.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.142.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.142.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.143.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.143.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.143.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.143.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.143.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.143.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.144.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.144.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.144.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.144.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.144.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.144.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.145.down_proj.weight": "model-00025-of-00092.safetensors", + 
"model.layers.24.mlp.experts.145.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.145.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.145.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.145.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.145.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.146.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.146.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.146.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.146.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.146.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.146.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.147.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.147.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.147.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.147.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.147.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.147.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.148.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.148.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.148.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.148.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.148.up_proj.weight": 
"model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.148.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.149.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.149.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.149.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.149.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.149.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.149.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.15.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.15.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.15.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.15.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.15.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.15.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.150.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.150.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.150.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.150.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.150.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.150.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.151.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.151.down_proj.weight_scale": "model-00025-of-00092.safetensors", + 
"model.layers.24.mlp.experts.151.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.151.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.151.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.151.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.152.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.152.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.152.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.152.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.152.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.152.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.153.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.153.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.153.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.153.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.153.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.153.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.154.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.154.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.154.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.154.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.154.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.154.up_proj.weight_scale": 
"model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.155.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.155.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.155.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.155.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.155.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.155.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.156.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.156.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.156.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.156.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.156.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.156.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.157.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.157.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.157.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.157.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.157.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.157.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.158.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.158.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.158.gate_proj.weight": "model-00025-of-00092.safetensors", + 
"model.layers.24.mlp.experts.158.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.158.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.158.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.159.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.159.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.159.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.159.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.159.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.159.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.16.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.16.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.16.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.16.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.16.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.16.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.17.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.17.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.17.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.17.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.17.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.17.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.18.down_proj.weight": 
"model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.18.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.18.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.18.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.18.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.18.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.19.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.19.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.19.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.19.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.19.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.19.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.2.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.2.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.2.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.2.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.2.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.2.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.20.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.20.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.20.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.20.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + 
"model.layers.24.mlp.experts.20.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.20.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.21.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.21.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.21.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.21.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.21.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.21.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.22.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.22.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.22.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.22.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.22.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.22.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.23.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.23.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.23.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.23.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.23.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.23.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.24.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.24.down_proj.weight_scale": 
"model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.24.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.24.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.24.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.24.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.25.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.25.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.25.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.25.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.25.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.25.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.26.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.26.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.26.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.26.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.26.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.26.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.27.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.27.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.27.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.27.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.27.up_proj.weight": "model-00025-of-00092.safetensors", + 
"model.layers.24.mlp.experts.27.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.28.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.28.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.28.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.28.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.28.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.28.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.29.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.29.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.29.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.29.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.29.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.29.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.3.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.3.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.3.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.3.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.3.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.3.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.30.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.30.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.30.gate_proj.weight": 
"model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.30.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.30.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.30.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.31.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.31.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.31.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.31.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.31.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.31.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.32.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.32.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.32.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.32.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.32.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.32.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.33.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.33.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.33.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.33.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.33.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.33.up_proj.weight_scale": "model-00025-of-00092.safetensors", + 
"model.layers.24.mlp.experts.34.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.34.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.34.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.34.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.34.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.34.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.35.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.35.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.35.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.35.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.35.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.35.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.36.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.36.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.36.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.36.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.36.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.36.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.37.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.37.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.37.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.37.gate_proj.weight_scale": 
"model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.37.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.37.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.38.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.38.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.38.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.38.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.38.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.38.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.39.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.39.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.39.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.39.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.39.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.39.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.4.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.4.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.4.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.4.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.4.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.4.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.40.down_proj.weight": "model-00025-of-00092.safetensors", + 
"model.layers.24.mlp.experts.40.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.40.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.40.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.40.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.40.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.41.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.41.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.41.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.41.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.41.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.41.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.42.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.42.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.42.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.42.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.42.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.42.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.43.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.43.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.43.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.43.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.43.up_proj.weight": 
"model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.43.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.44.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.44.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.44.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.44.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.44.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.44.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.45.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.45.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.45.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.45.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.45.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.45.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.46.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.46.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.46.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.46.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.46.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.46.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.47.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.47.down_proj.weight_scale": "model-00025-of-00092.safetensors", + 
"model.layers.24.mlp.experts.47.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.47.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.47.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.47.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.48.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.48.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.48.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.48.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.48.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.48.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.49.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.49.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.49.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.49.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.49.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.49.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.5.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.5.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.5.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.5.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.5.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.5.up_proj.weight_scale": "model-00025-of-00092.safetensors", 
+ "model.layers.24.mlp.experts.50.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.50.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.50.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.50.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.50.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.50.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.51.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.51.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.51.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.51.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.51.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.51.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.52.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.52.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.52.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.52.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.52.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.52.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.53.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.53.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.53.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.53.gate_proj.weight_scale": 
"model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.53.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.53.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.54.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.54.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.54.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.54.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.54.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.54.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.55.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.55.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.55.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.55.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.55.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.55.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.56.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.56.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.56.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.56.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.56.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.56.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.57.down_proj.weight": "model-00025-of-00092.safetensors", + 
"model.layers.24.mlp.experts.57.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.57.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.57.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.57.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.57.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.58.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.58.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.58.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.58.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.58.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.58.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.59.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.59.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.59.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.59.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.59.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.59.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.6.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.6.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.6.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.6.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.6.up_proj.weight": 
"model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.6.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.60.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.60.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.60.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.60.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.60.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.60.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.61.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.61.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.61.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.61.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.61.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.61.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.62.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.62.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.62.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.62.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.62.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.62.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.63.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.63.down_proj.weight_scale": "model-00025-of-00092.safetensors", + 
"model.layers.24.mlp.experts.63.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.63.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.63.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.63.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.64.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.64.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.64.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.64.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.64.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.64.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.65.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.65.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.65.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.65.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.65.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.65.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.66.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.66.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.66.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.66.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.66.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.66.up_proj.weight_scale": 
"model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.67.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.67.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.67.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.67.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.67.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.67.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.68.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.68.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.68.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.68.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.68.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.68.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.69.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.69.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.69.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.69.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.69.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.69.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.7.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.7.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.7.gate_proj.weight": "model-00025-of-00092.safetensors", + 
"model.layers.24.mlp.experts.7.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.7.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.7.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.70.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.70.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.70.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.70.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.70.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.70.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.71.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.71.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.71.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.71.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.71.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.71.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.72.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.72.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.72.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.72.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.72.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.72.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.73.down_proj.weight": 
"model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.73.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.73.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.73.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.73.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.73.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.74.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.74.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.74.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.74.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.74.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.74.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.75.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.75.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.75.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.75.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.75.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.75.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.76.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.76.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.76.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.76.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + 
"model.layers.24.mlp.experts.76.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.76.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.77.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.77.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.77.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.77.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.77.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.77.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.78.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.78.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.78.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.78.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.78.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.78.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.79.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.79.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.79.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.79.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.79.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.79.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.8.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.8.down_proj.weight_scale": 
"model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.8.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.8.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.8.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.8.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.80.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.80.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.80.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.80.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.80.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.80.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.81.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.81.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.81.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.81.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.81.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.81.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.82.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.82.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.82.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.82.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.82.up_proj.weight": "model-00025-of-00092.safetensors", + 
"model.layers.24.mlp.experts.82.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.83.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.83.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.83.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.83.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.83.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.83.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.84.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.84.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.84.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.84.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.84.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.84.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.85.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.85.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.85.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.85.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.85.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.85.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.86.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.86.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.86.gate_proj.weight": 
"model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.86.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.86.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.86.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.87.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.87.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.87.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.87.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.87.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.87.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.88.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.88.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.88.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.88.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.88.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.88.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.89.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.89.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.89.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.89.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.89.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.89.up_proj.weight_scale": "model-00025-of-00092.safetensors", + 
"model.layers.24.mlp.experts.9.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.9.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.9.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.9.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.9.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.9.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.90.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.90.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.90.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.90.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.90.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.90.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.91.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.91.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.91.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.91.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.91.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.91.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.92.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.92.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.92.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.92.gate_proj.weight_scale": 
"model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.92.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.92.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.93.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.93.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.93.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.93.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.93.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.93.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.94.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.94.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.94.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.94.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.94.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.94.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.95.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.95.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.95.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.95.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.95.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.95.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.96.down_proj.weight": "model-00025-of-00092.safetensors", + 
"model.layers.24.mlp.experts.96.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.96.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.96.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.96.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.96.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.97.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.97.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.97.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.97.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.97.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.97.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.98.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.98.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.98.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.98.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.98.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.98.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.99.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.99.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.99.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.99.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.99.up_proj.weight": 
"model-00025-of-00092.safetensors", + "model.layers.24.mlp.experts.99.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.gate.e_score_correction_bias": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.gate.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.shared_experts.down_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.shared_experts.down_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.shared_experts.gate_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.shared_experts.gate_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.shared_experts.up_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.mlp.shared_experts.up_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.post_attention_layernorm.weight": "model-00025-of-00092.safetensors", + "model.layers.24.self_attn.k_norm.weight": "model-00025-of-00092.safetensors", + "model.layers.24.self_attn.k_proj.bias": "model-00025-of-00092.safetensors", + "model.layers.24.self_attn.k_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.self_attn.k_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.self_attn.o_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.self_attn.o_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.self_attn.q_norm.weight": "model-00025-of-00092.safetensors", + "model.layers.24.self_attn.q_proj.bias": "model-00025-of-00092.safetensors", + "model.layers.24.self_attn.q_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.self_attn.q_proj.weight_scale": "model-00025-of-00092.safetensors", + "model.layers.24.self_attn.v_proj.bias": "model-00025-of-00092.safetensors", + "model.layers.24.self_attn.v_proj.weight": "model-00025-of-00092.safetensors", + "model.layers.24.self_attn.v_proj.weight_scale": 
"model-00025-of-00092.safetensors", + "model.layers.25.input_layernorm.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.0.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.0.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.0.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.0.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.0.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.0.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.1.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.1.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.1.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.1.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.1.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.1.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.10.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.10.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.10.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.10.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.10.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.10.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.100.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.100.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.100.gate_proj.weight": 
"model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.100.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.100.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.100.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.101.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.101.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.101.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.101.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.101.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.101.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.102.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.102.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.102.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.102.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.102.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.102.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.103.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.103.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.103.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.103.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.103.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.103.up_proj.weight_scale": "model-00026-of-00092.safetensors", + 
"model.layers.25.mlp.experts.104.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.104.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.104.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.104.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.104.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.104.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.105.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.105.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.105.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.105.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.105.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.105.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.106.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.106.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.106.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.106.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.106.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.106.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.107.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.107.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.107.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.107.gate_proj.weight_scale": 
"model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.107.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.107.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.108.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.108.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.108.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.108.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.108.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.108.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.109.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.109.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.109.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.109.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.109.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.109.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.11.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.11.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.11.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.11.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.11.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.11.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.110.down_proj.weight": "model-00026-of-00092.safetensors", + 
"model.layers.25.mlp.experts.110.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.110.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.110.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.110.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.110.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.111.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.111.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.111.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.111.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.111.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.111.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.112.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.112.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.112.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.112.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.112.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.112.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.113.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.113.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.113.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.113.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.113.up_proj.weight": 
"model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.113.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.114.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.114.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.114.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.114.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.114.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.114.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.115.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.115.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.115.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.115.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.115.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.115.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.116.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.116.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.116.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.116.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.116.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.116.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.117.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.117.down_proj.weight_scale": "model-00026-of-00092.safetensors", + 
"model.layers.25.mlp.experts.117.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.117.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.117.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.117.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.118.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.118.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.118.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.118.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.118.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.118.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.119.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.119.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.119.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.119.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.119.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.119.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.12.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.12.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.12.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.12.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.12.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.12.up_proj.weight_scale": 
"model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.120.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.120.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.120.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.120.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.120.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.120.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.121.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.121.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.121.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.121.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.121.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.121.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.122.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.122.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.122.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.122.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.122.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.122.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.123.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.123.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.123.gate_proj.weight": "model-00026-of-00092.safetensors", + 
"model.layers.25.mlp.experts.123.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.123.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.123.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.124.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.124.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.124.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.124.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.124.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.124.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.125.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.125.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.125.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.125.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.125.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.125.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.126.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.126.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.126.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.126.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.126.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.126.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.127.down_proj.weight": 
"model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.127.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.127.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.127.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.127.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.127.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.128.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.128.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.128.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.128.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.128.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.128.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.129.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.129.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.129.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.129.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.129.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.129.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.13.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.13.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.13.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.13.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + 
"model.layers.25.mlp.experts.13.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.13.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.130.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.130.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.130.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.130.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.130.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.130.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.131.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.131.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.131.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.131.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.131.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.131.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.132.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.132.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.132.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.132.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.132.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.132.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.133.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.133.down_proj.weight_scale": 
"model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.133.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.133.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.133.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.133.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.134.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.134.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.134.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.134.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.134.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.134.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.135.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.135.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.135.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.135.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.135.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.135.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.136.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.136.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.136.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.136.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.136.up_proj.weight": "model-00026-of-00092.safetensors", + 
"model.layers.25.mlp.experts.136.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.137.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.137.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.137.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.137.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.137.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.137.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.138.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.138.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.138.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.138.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.138.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.138.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.139.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.139.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.139.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.139.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.139.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.139.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.14.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.14.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.14.gate_proj.weight": 
"model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.14.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.14.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.14.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.140.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.140.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.140.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.140.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.140.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.140.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.141.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.141.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.141.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.141.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.141.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.141.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.142.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.142.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.142.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.142.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.142.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.142.up_proj.weight_scale": "model-00026-of-00092.safetensors", + 
"model.layers.25.mlp.experts.143.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.143.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.143.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.143.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.143.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.143.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.144.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.144.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.144.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.144.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.144.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.144.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.145.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.145.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.145.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.145.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.145.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.145.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.146.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.146.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.146.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.146.gate_proj.weight_scale": 
"model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.146.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.146.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.147.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.147.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.147.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.147.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.147.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.147.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.148.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.148.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.148.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.148.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.148.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.148.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.149.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.149.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.149.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.149.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.149.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.149.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.15.down_proj.weight": "model-00026-of-00092.safetensors", + 
"model.layers.25.mlp.experts.15.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.15.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.15.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.15.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.15.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.150.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.150.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.150.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.150.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.150.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.150.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.151.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.151.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.151.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.151.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.151.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.151.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.152.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.152.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.152.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.152.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.152.up_proj.weight": 
"model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.152.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.153.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.153.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.153.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.153.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.153.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.153.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.154.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.154.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.154.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.154.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.154.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.154.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.155.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.155.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.155.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.155.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.155.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.155.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.156.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.156.down_proj.weight_scale": "model-00026-of-00092.safetensors", + 
"model.layers.25.mlp.experts.156.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.156.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.156.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.156.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.157.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.157.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.157.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.157.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.157.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.157.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.158.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.158.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.158.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.158.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.158.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.158.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.159.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.159.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.159.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.159.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.159.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.159.up_proj.weight_scale": 
"model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.16.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.16.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.16.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.16.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.16.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.16.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.17.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.17.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.17.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.17.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.17.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.17.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.18.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.18.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.18.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.18.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.18.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.18.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.19.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.19.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.19.gate_proj.weight": "model-00026-of-00092.safetensors", + 
"model.layers.25.mlp.experts.19.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.19.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.19.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.2.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.2.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.2.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.2.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.2.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.2.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.20.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.20.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.20.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.20.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.20.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.20.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.21.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.21.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.21.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.21.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.21.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.21.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.22.down_proj.weight": "model-00026-of-00092.safetensors", 
+ "model.layers.25.mlp.experts.22.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.22.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.22.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.22.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.22.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.23.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.23.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.23.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.23.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.23.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.23.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.24.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.24.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.24.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.24.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.24.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.24.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.25.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.25.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.25.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.25.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.25.up_proj.weight": 
"model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.25.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.26.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.26.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.26.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.26.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.26.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.26.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.27.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.27.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.27.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.27.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.27.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.27.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.28.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.28.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.28.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.28.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.28.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.28.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.29.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.29.down_proj.weight_scale": "model-00026-of-00092.safetensors", + 
"model.layers.25.mlp.experts.29.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.29.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.29.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.29.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.3.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.3.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.3.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.3.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.3.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.3.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.30.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.30.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.30.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.30.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.30.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.30.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.31.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.31.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.31.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.31.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.31.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.31.up_proj.weight_scale": "model-00026-of-00092.safetensors", 
+ "model.layers.25.mlp.experts.32.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.32.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.32.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.32.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.32.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.32.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.33.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.33.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.33.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.33.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.33.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.33.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.34.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.34.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.34.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.34.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.34.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.34.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.35.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.35.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.35.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.35.gate_proj.weight_scale": 
"model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.35.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.35.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.36.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.36.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.36.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.36.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.36.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.36.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.37.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.37.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.37.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.37.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.37.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.37.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.38.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.38.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.38.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.38.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.38.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.38.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.39.down_proj.weight": "model-00026-of-00092.safetensors", + 
"model.layers.25.mlp.experts.39.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.39.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.39.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.39.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.39.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.4.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.4.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.4.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.4.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.4.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.4.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.40.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.40.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.40.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.40.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.40.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.40.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.41.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.41.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.41.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.41.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.41.up_proj.weight": 
"model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.41.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.42.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.42.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.42.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.42.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.42.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.42.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.43.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.43.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.43.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.43.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.43.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.43.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.44.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.44.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.44.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.44.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.44.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.44.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.45.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.45.down_proj.weight_scale": "model-00026-of-00092.safetensors", + 
"model.layers.25.mlp.experts.45.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.45.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.45.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.45.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.46.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.46.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.46.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.46.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.46.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.46.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.47.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.47.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.47.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.47.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.47.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.47.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.48.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.48.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.48.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.48.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.48.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.48.up_proj.weight_scale": 
"model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.49.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.49.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.49.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.49.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.49.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.49.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.5.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.5.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.5.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.5.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.5.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.5.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.50.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.50.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.50.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.50.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.50.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.50.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.51.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.51.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.51.gate_proj.weight": "model-00026-of-00092.safetensors", + 
"model.layers.25.mlp.experts.51.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.51.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.51.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.52.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.52.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.52.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.52.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.52.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.52.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.53.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.53.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.53.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.53.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.53.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.53.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.54.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.54.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.54.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.54.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.54.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.54.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.55.down_proj.weight": 
"model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.55.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.55.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.55.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.55.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.55.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.56.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.56.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.56.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.56.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.56.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.56.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.57.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.57.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.57.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.57.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.57.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.57.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.58.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.58.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.58.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.58.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + 
"model.layers.25.mlp.experts.58.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.58.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.59.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.59.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.59.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.59.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.59.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.59.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.6.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.6.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.6.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.6.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.6.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.6.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.60.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.60.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.60.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.60.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.60.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.60.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.61.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.61.down_proj.weight_scale": "model-00026-of-00092.safetensors", 
+ "model.layers.25.mlp.experts.61.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.61.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.61.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.61.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.62.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.62.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.62.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.62.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.62.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.62.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.63.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.63.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.63.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.63.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.63.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.63.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.64.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.64.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.64.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.64.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.64.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.64.up_proj.weight_scale": 
"model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.65.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.65.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.65.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.65.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.65.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.65.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.66.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.66.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.66.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.66.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.66.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.66.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.67.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.67.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.67.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.67.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.67.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.67.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.68.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.68.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.68.gate_proj.weight": "model-00026-of-00092.safetensors", + 
"model.layers.25.mlp.experts.68.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.68.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.68.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.69.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.69.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.69.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.69.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.69.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.69.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.7.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.7.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.7.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.7.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.7.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.7.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.70.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.70.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.70.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.70.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.70.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.70.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.71.down_proj.weight": "model-00026-of-00092.safetensors", 
+ "model.layers.25.mlp.experts.71.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.71.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.71.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.71.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.71.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.72.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.72.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.72.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.72.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.72.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.72.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.73.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.73.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.73.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.73.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.73.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.73.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.74.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.74.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.74.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.74.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.74.up_proj.weight": 
"model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.74.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.75.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.75.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.75.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.75.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.75.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.75.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.76.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.76.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.76.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.76.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.76.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.76.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.77.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.77.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.77.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.77.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.77.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.77.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.78.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.78.down_proj.weight_scale": "model-00026-of-00092.safetensors", + 
"model.layers.25.mlp.experts.78.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.78.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.78.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.78.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.79.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.79.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.79.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.79.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.79.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.79.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.8.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.8.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.8.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.8.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.8.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.8.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.80.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.80.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.80.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.80.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.80.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.80.up_proj.weight_scale": "model-00026-of-00092.safetensors", 
+ "model.layers.25.mlp.experts.81.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.81.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.81.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.81.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.81.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.81.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.82.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.82.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.82.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.82.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.82.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.82.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.83.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.83.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.83.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.83.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.83.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.83.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.84.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.84.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.84.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.84.gate_proj.weight_scale": 
"model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.84.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.84.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.85.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.85.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.85.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.85.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.85.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.85.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.86.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.86.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.86.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.86.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.86.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.86.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.87.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.87.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.87.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.87.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.87.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.87.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.88.down_proj.weight": "model-00026-of-00092.safetensors", + 
"model.layers.25.mlp.experts.88.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.88.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.88.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.88.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.88.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.89.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.89.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.89.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.89.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.89.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.89.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.9.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.9.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.9.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.9.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.9.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.9.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.90.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.90.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.90.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.90.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.90.up_proj.weight": 
"model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.90.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.91.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.91.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.91.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.91.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.91.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.91.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.92.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.92.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.92.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.92.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.92.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.92.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.93.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.93.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.93.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.93.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.93.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.93.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.94.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.94.down_proj.weight_scale": "model-00026-of-00092.safetensors", + 
"model.layers.25.mlp.experts.94.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.94.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.94.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.94.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.95.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.95.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.95.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.95.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.95.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.95.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.96.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.96.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.96.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.96.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.96.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.96.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.97.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.97.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.97.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.97.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.97.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.97.up_proj.weight_scale": 
"model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.98.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.98.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.98.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.98.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.98.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.98.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.99.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.99.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.99.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.99.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.99.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.experts.99.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.gate.e_score_correction_bias": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.gate.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.shared_experts.down_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.shared_experts.down_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.shared_experts.gate_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.shared_experts.gate_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.shared_experts.up_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.mlp.shared_experts.up_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.post_attention_layernorm.weight": "model-00026-of-00092.safetensors", + 
"model.layers.25.self_attn.k_norm.weight": "model-00026-of-00092.safetensors", + "model.layers.25.self_attn.k_proj.bias": "model-00026-of-00092.safetensors", + "model.layers.25.self_attn.k_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.self_attn.k_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.self_attn.o_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.self_attn.o_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.self_attn.q_norm.weight": "model-00026-of-00092.safetensors", + "model.layers.25.self_attn.q_proj.bias": "model-00026-of-00092.safetensors", + "model.layers.25.self_attn.q_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.self_attn.q_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.25.self_attn.v_proj.bias": "model-00026-of-00092.safetensors", + "model.layers.25.self_attn.v_proj.weight": "model-00026-of-00092.safetensors", + "model.layers.25.self_attn.v_proj.weight_scale": "model-00026-of-00092.safetensors", + "model.layers.26.input_layernorm.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.0.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.0.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.0.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.0.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.0.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.0.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.1.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.1.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.1.gate_proj.weight": "model-00027-of-00092.safetensors", + 
"model.layers.26.mlp.experts.1.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.1.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.1.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.10.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.10.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.10.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.10.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.10.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.10.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.100.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.100.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.100.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.100.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.100.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.100.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.101.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.101.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.101.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.101.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.101.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.101.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.102.down_proj.weight": 
"model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.102.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.102.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.102.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.102.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.102.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.103.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.103.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.103.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.103.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.103.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.103.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.104.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.104.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.104.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.104.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.104.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.104.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.105.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.105.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.105.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.105.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + 
"model.layers.26.mlp.experts.105.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.105.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.106.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.106.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.106.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.106.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.106.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.106.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.107.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.107.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.107.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.107.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.107.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.107.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.108.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.108.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.108.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.108.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.108.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.108.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.109.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.109.down_proj.weight_scale": 
"model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.109.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.109.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.109.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.109.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.11.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.11.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.11.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.11.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.11.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.11.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.110.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.110.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.110.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.110.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.110.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.110.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.111.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.111.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.111.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.111.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.111.up_proj.weight": "model-00027-of-00092.safetensors", + 
"model.layers.26.mlp.experts.111.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.112.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.112.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.112.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.112.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.112.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.112.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.113.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.113.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.113.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.113.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.113.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.113.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.114.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.114.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.114.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.114.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.114.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.114.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.115.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.115.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.115.gate_proj.weight": 
"model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.115.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.115.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.115.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.116.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.116.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.116.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.116.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.116.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.116.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.117.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.117.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.117.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.117.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.117.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.117.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.118.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.118.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.118.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.118.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.118.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.118.up_proj.weight_scale": "model-00027-of-00092.safetensors", + 
"model.layers.26.mlp.experts.119.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.119.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.119.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.119.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.119.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.119.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.12.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.12.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.12.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.12.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.12.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.12.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.120.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.120.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.120.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.120.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.120.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.120.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.121.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.121.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.121.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.121.gate_proj.weight_scale": 
"model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.121.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.121.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.122.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.122.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.122.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.122.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.122.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.122.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.123.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.123.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.123.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.123.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.123.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.123.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.124.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.124.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.124.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.124.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.124.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.124.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.125.down_proj.weight": "model-00027-of-00092.safetensors", + 
"model.layers.26.mlp.experts.125.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.125.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.125.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.125.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.125.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.126.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.126.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.126.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.126.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.126.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.126.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.127.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.127.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.127.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.127.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.127.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.127.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.128.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.128.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.128.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.128.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.128.up_proj.weight": 
"model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.128.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.129.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.129.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.129.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.129.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.129.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.129.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.13.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.13.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.13.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.13.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.13.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.13.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.130.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.130.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.130.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.130.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.130.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.130.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.131.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.131.down_proj.weight_scale": "model-00027-of-00092.safetensors", + 
"model.layers.26.mlp.experts.131.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.131.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.131.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.131.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.132.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.132.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.132.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.132.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.132.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.132.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.133.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.133.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.133.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.133.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.133.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.133.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.134.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.134.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.134.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.134.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.134.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.134.up_proj.weight_scale": 
"model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.135.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.135.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.135.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.135.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.135.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.135.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.136.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.136.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.136.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.136.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.136.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.136.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.137.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.137.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.137.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.137.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.137.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.137.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.138.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.138.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.138.gate_proj.weight": "model-00027-of-00092.safetensors", + 
"model.layers.26.mlp.experts.138.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.138.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.138.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.139.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.139.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.139.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.139.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.139.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.139.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.14.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.14.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.14.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.14.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.14.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.14.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.140.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.140.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.140.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.140.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.140.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.140.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.141.down_proj.weight": 
"model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.141.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.141.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.141.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.141.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.141.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.142.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.142.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.142.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.142.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.142.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.142.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.143.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.143.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.143.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.143.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.143.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.143.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.144.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.144.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.144.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.144.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + 
"model.layers.26.mlp.experts.144.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.144.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.145.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.145.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.145.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.145.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.145.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.145.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.146.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.146.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.146.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.146.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.146.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.146.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.147.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.147.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.147.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.147.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.147.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.147.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.148.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.148.down_proj.weight_scale": 
"model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.148.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.148.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.148.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.148.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.149.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.149.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.149.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.149.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.149.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.149.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.15.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.15.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.15.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.15.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.15.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.15.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.150.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.150.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.150.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.150.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.150.up_proj.weight": "model-00027-of-00092.safetensors", + 
"model.layers.26.mlp.experts.150.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.151.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.151.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.151.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.151.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.151.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.151.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.152.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.152.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.152.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.152.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.152.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.152.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.153.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.153.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.153.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.153.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.153.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.153.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.154.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.154.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.154.gate_proj.weight": 
"model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.154.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.154.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.154.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.155.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.155.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.155.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.155.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.155.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.155.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.156.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.156.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.156.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.156.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.156.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.156.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.157.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.157.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.157.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.157.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.157.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.157.up_proj.weight_scale": "model-00027-of-00092.safetensors", + 
"model.layers.26.mlp.experts.158.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.158.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.158.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.158.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.158.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.158.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.159.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.159.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.159.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.159.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.159.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.159.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.16.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.16.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.16.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.16.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.16.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.16.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.17.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.17.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.17.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.17.gate_proj.weight_scale": 
"model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.17.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.17.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.18.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.18.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.18.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.18.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.18.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.18.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.19.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.19.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.19.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.19.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.19.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.19.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.2.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.2.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.2.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.2.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.2.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.2.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.20.down_proj.weight": "model-00027-of-00092.safetensors", + 
"model.layers.26.mlp.experts.20.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.20.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.20.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.20.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.20.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.21.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.21.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.21.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.21.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.21.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.21.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.22.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.22.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.22.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.22.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.22.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.22.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.23.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.23.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.23.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.23.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.23.up_proj.weight": 
"model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.23.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.24.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.24.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.24.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.24.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.24.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.24.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.25.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.25.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.25.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.25.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.25.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.25.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.26.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.26.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.26.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.26.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.26.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.26.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.27.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.27.down_proj.weight_scale": "model-00027-of-00092.safetensors", + 
"model.layers.26.mlp.experts.27.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.27.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.27.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.27.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.28.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.28.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.28.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.28.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.28.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.28.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.29.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.29.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.29.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.29.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.29.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.29.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.3.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.3.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.3.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.3.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.3.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.3.up_proj.weight_scale": "model-00027-of-00092.safetensors", 
+ "model.layers.26.mlp.experts.30.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.30.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.30.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.30.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.30.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.30.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.31.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.31.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.31.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.31.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.31.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.31.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.32.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.32.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.32.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.32.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.32.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.32.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.33.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.33.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.33.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.33.gate_proj.weight_scale": 
"model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.33.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.33.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.34.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.34.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.34.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.34.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.34.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.34.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.35.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.35.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.35.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.35.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.35.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.35.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.36.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.36.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.36.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.36.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.36.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.36.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.37.down_proj.weight": "model-00027-of-00092.safetensors", + 
"model.layers.26.mlp.experts.37.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.37.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.37.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.37.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.37.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.38.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.38.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.38.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.38.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.38.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.38.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.39.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.39.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.39.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.39.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.39.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.39.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.4.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.4.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.4.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.4.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.4.up_proj.weight": 
"model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.4.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.40.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.40.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.40.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.40.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.40.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.40.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.41.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.41.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.41.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.41.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.41.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.41.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.42.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.42.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.42.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.42.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.42.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.42.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.43.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.43.down_proj.weight_scale": "model-00027-of-00092.safetensors", + 
"model.layers.26.mlp.experts.43.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.43.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.43.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.43.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.44.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.44.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.44.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.44.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.44.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.44.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.45.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.45.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.45.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.45.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.45.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.45.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.46.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.46.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.46.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.46.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.46.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.46.up_proj.weight_scale": 
"model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.47.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.47.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.47.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.47.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.47.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.47.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.48.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.48.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.48.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.48.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.48.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.48.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.49.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.49.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.49.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.49.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.49.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.49.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.5.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.5.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.5.gate_proj.weight": "model-00027-of-00092.safetensors", + 
"model.layers.26.mlp.experts.5.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.5.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.5.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.50.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.50.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.50.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.50.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.50.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.50.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.51.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.51.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.51.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.51.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.51.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.51.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.52.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.52.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.52.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.52.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.52.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.52.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.53.down_proj.weight": 
"model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.53.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.53.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.53.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.53.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.53.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.54.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.54.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.54.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.54.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.54.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.54.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.55.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.55.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.55.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.55.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.55.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.55.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.56.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.56.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.56.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.56.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + 
"model.layers.26.mlp.experts.56.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.56.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.57.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.57.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.57.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.57.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.57.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.57.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.58.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.58.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.58.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.58.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.58.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.58.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.59.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.59.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.59.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.59.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.59.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.59.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.6.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.6.down_proj.weight_scale": 
"model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.6.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.6.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.6.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.6.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.60.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.60.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.60.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.60.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.60.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.60.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.61.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.61.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.61.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.61.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.61.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.61.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.62.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.62.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.62.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.62.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.62.up_proj.weight": "model-00027-of-00092.safetensors", + 
"model.layers.26.mlp.experts.62.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.63.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.63.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.63.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.63.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.63.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.63.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.64.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.64.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.64.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.64.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.64.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.64.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.65.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.65.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.65.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.65.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.65.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.65.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.66.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.66.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.66.gate_proj.weight": 
"model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.66.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.66.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.66.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.67.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.67.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.67.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.67.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.67.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.67.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.68.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.68.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.68.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.68.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.68.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.68.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.69.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.69.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.69.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.69.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.69.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.69.up_proj.weight_scale": "model-00027-of-00092.safetensors", + 
"model.layers.26.mlp.experts.7.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.7.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.7.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.7.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.7.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.7.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.70.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.70.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.70.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.70.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.70.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.70.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.71.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.71.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.71.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.71.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.71.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.71.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.72.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.72.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.72.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.72.gate_proj.weight_scale": 
"model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.72.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.72.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.73.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.73.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.73.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.73.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.73.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.73.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.74.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.74.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.74.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.74.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.74.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.74.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.75.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.75.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.75.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.75.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.75.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.75.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.76.down_proj.weight": "model-00027-of-00092.safetensors", + 
"model.layers.26.mlp.experts.76.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.76.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.76.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.76.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.76.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.77.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.77.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.77.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.77.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.77.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.77.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.78.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.78.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.78.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.78.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.78.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.78.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.79.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.79.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.79.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.79.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.79.up_proj.weight": 
"model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.79.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.8.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.8.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.8.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.8.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.8.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.8.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.80.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.80.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.80.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.80.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.80.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.80.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.81.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.81.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.81.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.81.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.81.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.81.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.82.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.82.down_proj.weight_scale": "model-00027-of-00092.safetensors", + 
"model.layers.26.mlp.experts.82.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.82.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.82.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.82.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.83.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.83.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.83.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.83.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.83.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.83.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.84.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.84.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.84.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.84.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.84.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.84.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.85.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.85.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.85.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.85.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.85.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.85.up_proj.weight_scale": 
"model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.86.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.86.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.86.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.86.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.86.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.86.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.87.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.87.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.87.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.87.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.87.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.87.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.88.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.88.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.88.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.88.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.88.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.88.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.89.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.89.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.89.gate_proj.weight": "model-00027-of-00092.safetensors", + 
"model.layers.26.mlp.experts.89.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.89.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.89.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.9.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.9.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.9.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.9.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.9.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.9.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.90.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.90.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.90.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.90.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.90.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.90.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.91.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.91.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.91.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.91.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.91.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.91.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.92.down_proj.weight": "model-00027-of-00092.safetensors", 
+ "model.layers.26.mlp.experts.92.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.92.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.92.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.92.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.92.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.93.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.93.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.93.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.93.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.93.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.93.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.94.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.94.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.94.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.94.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.94.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.94.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.95.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.95.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.95.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.95.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.95.up_proj.weight": 
"model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.95.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.96.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.96.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.96.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.96.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.96.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.96.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.97.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.97.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.97.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.97.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.97.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.97.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.98.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.98.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.98.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.98.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.98.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.98.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.99.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.99.down_proj.weight_scale": "model-00027-of-00092.safetensors", + 
"model.layers.26.mlp.experts.99.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.99.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.99.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.experts.99.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.gate.e_score_correction_bias": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.gate.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.shared_experts.down_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.shared_experts.down_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.shared_experts.gate_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.shared_experts.gate_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.shared_experts.up_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.mlp.shared_experts.up_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.post_attention_layernorm.weight": "model-00027-of-00092.safetensors", + "model.layers.26.self_attn.k_norm.weight": "model-00027-of-00092.safetensors", + "model.layers.26.self_attn.k_proj.bias": "model-00027-of-00092.safetensors", + "model.layers.26.self_attn.k_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.self_attn.k_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.self_attn.o_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.self_attn.o_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.26.self_attn.q_norm.weight": "model-00027-of-00092.safetensors", + "model.layers.26.self_attn.q_proj.bias": "model-00027-of-00092.safetensors", + "model.layers.26.self_attn.q_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.self_attn.q_proj.weight_scale": 
"model-00027-of-00092.safetensors", + "model.layers.26.self_attn.v_proj.bias": "model-00027-of-00092.safetensors", + "model.layers.26.self_attn.v_proj.weight": "model-00027-of-00092.safetensors", + "model.layers.26.self_attn.v_proj.weight_scale": "model-00027-of-00092.safetensors", + "model.layers.27.input_layernorm.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.0.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.0.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.0.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.0.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.0.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.0.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.1.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.1.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.1.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.1.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.1.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.1.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.10.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.10.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.10.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.10.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.10.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.10.up_proj.weight_scale": "model-00028-of-00092.safetensors", + 
"model.layers.27.mlp.experts.100.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.100.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.100.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.100.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.100.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.100.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.101.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.101.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.101.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.101.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.101.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.101.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.102.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.102.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.102.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.102.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.102.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.102.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.103.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.103.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.103.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.103.gate_proj.weight_scale": 
"model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.103.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.103.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.104.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.104.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.104.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.104.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.104.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.104.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.105.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.105.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.105.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.105.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.105.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.105.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.106.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.106.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.106.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.106.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.106.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.106.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.107.down_proj.weight": "model-00028-of-00092.safetensors", + 
"model.layers.27.mlp.experts.107.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.107.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.107.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.107.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.107.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.108.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.108.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.108.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.108.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.108.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.108.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.109.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.109.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.109.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.109.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.109.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.109.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.11.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.11.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.11.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.11.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.11.up_proj.weight": 
"model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.11.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.110.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.110.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.110.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.110.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.110.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.110.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.111.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.111.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.111.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.111.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.111.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.111.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.112.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.112.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.112.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.112.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.112.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.112.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.113.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.113.down_proj.weight_scale": "model-00028-of-00092.safetensors", + 
"model.layers.27.mlp.experts.113.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.113.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.113.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.113.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.114.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.114.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.114.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.114.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.114.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.114.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.115.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.115.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.115.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.115.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.115.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.115.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.116.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.116.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.116.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.116.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.116.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.116.up_proj.weight_scale": 
"model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.117.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.117.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.117.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.117.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.117.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.117.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.118.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.118.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.118.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.118.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.118.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.118.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.119.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.119.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.119.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.119.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.119.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.119.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.12.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.12.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.12.gate_proj.weight": "model-00028-of-00092.safetensors", + 
"model.layers.27.mlp.experts.12.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.12.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.12.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.120.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.120.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.120.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.120.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.120.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.120.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.121.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.121.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.121.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.121.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.121.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.121.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.122.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.122.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.122.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.122.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.122.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.122.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.123.down_proj.weight": 
"model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.123.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.123.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.123.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.123.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.123.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.124.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.124.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.124.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.124.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.124.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.124.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.125.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.125.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.125.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.125.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.125.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.125.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.126.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.126.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.126.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.126.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + 
"model.layers.27.mlp.experts.126.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.126.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.127.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.127.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.127.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.127.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.127.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.127.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.128.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.128.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.128.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.128.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.128.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.128.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.129.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.129.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.129.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.129.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.129.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.129.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.13.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.13.down_proj.weight_scale": 
"model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.13.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.13.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.13.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.13.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.130.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.130.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.130.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.130.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.130.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.130.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.131.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.131.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.131.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.131.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.131.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.131.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.132.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.132.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.132.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.132.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.132.up_proj.weight": "model-00028-of-00092.safetensors", + 
"model.layers.27.mlp.experts.132.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.133.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.133.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.133.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.133.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.133.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.133.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.134.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.134.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.134.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.134.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.134.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.134.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.135.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.135.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.135.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.135.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.135.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.135.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.136.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.136.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.136.gate_proj.weight": 
"model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.136.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.136.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.136.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.137.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.137.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.137.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.137.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.137.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.137.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.138.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.138.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.138.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.138.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.138.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.138.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.139.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.139.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.139.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.139.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.139.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.139.up_proj.weight_scale": "model-00028-of-00092.safetensors", + 
"model.layers.27.mlp.experts.14.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.14.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.14.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.14.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.14.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.14.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.140.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.140.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.140.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.140.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.140.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.140.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.141.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.141.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.141.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.141.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.141.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.141.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.142.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.142.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.142.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.142.gate_proj.weight_scale": 
"model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.142.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.142.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.143.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.143.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.143.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.143.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.143.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.143.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.144.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.144.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.144.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.144.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.144.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.144.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.145.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.145.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.145.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.145.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.145.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.145.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.146.down_proj.weight": "model-00028-of-00092.safetensors", + 
"model.layers.27.mlp.experts.146.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.146.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.146.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.146.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.146.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.147.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.147.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.147.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.147.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.147.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.147.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.148.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.148.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.148.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.148.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.148.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.148.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.149.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.149.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.149.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.149.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.149.up_proj.weight": 
"model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.149.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.15.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.15.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.15.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.15.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.15.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.15.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.150.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.150.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.150.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.150.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.150.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.150.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.151.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.151.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.151.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.151.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.151.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.151.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.152.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.152.down_proj.weight_scale": "model-00028-of-00092.safetensors", + 
"model.layers.27.mlp.experts.152.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.152.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.152.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.152.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.153.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.153.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.153.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.153.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.153.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.153.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.154.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.154.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.154.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.154.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.154.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.154.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.155.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.155.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.155.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.155.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.155.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.155.up_proj.weight_scale": 
"model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.156.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.156.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.156.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.156.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.156.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.156.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.157.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.157.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.157.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.157.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.157.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.157.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.158.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.158.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.158.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.158.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.158.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.158.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.159.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.159.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.159.gate_proj.weight": "model-00028-of-00092.safetensors", + 
"model.layers.27.mlp.experts.159.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.159.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.159.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.16.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.16.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.16.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.16.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.16.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.16.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.17.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.17.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.17.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.17.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.17.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.17.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.18.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.18.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.18.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.18.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.18.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.18.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.19.down_proj.weight": 
"model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.19.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.19.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.19.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.19.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.19.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.2.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.2.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.2.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.2.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.2.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.2.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.20.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.20.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.20.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.20.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.20.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.20.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.21.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.21.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.21.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.21.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + 
"model.layers.27.mlp.experts.21.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.21.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.22.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.22.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.22.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.22.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.22.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.22.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.23.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.23.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.23.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.23.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.23.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.23.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.24.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.24.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.24.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.24.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.24.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.24.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.25.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.25.down_proj.weight_scale": 
"model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.25.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.25.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.25.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.25.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.26.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.26.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.26.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.26.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.26.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.26.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.27.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.27.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.27.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.27.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.27.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.27.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.28.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.28.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.28.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.28.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.28.up_proj.weight": "model-00028-of-00092.safetensors", + 
"model.layers.27.mlp.experts.28.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.29.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.29.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.29.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.29.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.29.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.29.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.3.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.3.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.3.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.3.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.3.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.3.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.30.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.30.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.30.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.30.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.30.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.30.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.31.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.31.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.31.gate_proj.weight": 
"model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.31.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.31.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.31.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.32.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.32.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.32.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.32.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.32.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.32.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.33.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.33.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.33.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.33.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.33.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.33.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.34.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.34.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.34.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.34.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.34.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.34.up_proj.weight_scale": "model-00028-of-00092.safetensors", + 
"model.layers.27.mlp.experts.35.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.35.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.35.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.35.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.35.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.35.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.36.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.36.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.36.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.36.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.36.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.36.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.37.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.37.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.37.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.37.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.37.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.37.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.38.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.38.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.38.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.38.gate_proj.weight_scale": 
"model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.38.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.38.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.39.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.39.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.39.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.39.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.39.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.39.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.4.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.4.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.4.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.4.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.4.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.4.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.40.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.40.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.40.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.40.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.40.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.40.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.41.down_proj.weight": "model-00028-of-00092.safetensors", + 
"model.layers.27.mlp.experts.41.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.41.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.41.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.41.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.41.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.42.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.42.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.42.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.42.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.42.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.42.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.43.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.43.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.43.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.43.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.43.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.43.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.44.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.44.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.44.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.44.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.44.up_proj.weight": 
"model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.44.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.45.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.45.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.45.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.45.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.45.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.45.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.46.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.46.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.46.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.46.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.46.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.46.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.47.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.47.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.47.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.47.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.47.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.47.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.48.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.48.down_proj.weight_scale": "model-00028-of-00092.safetensors", + 
"model.layers.27.mlp.experts.48.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.48.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.48.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.48.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.49.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.49.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.49.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.49.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.49.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.49.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.5.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.5.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.5.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.5.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.5.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.5.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.50.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.50.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.50.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.50.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.50.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.50.up_proj.weight_scale": "model-00028-of-00092.safetensors", 
+ "model.layers.27.mlp.experts.51.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.51.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.51.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.51.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.51.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.51.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.52.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.52.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.52.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.52.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.52.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.52.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.53.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.53.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.53.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.53.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.53.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.53.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.54.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.54.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.54.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.54.gate_proj.weight_scale": 
"model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.54.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.54.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.55.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.55.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.55.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.55.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.55.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.55.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.56.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.56.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.56.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.56.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.56.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.56.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.57.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.57.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.57.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.57.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.57.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.57.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.58.down_proj.weight": "model-00028-of-00092.safetensors", + 
"model.layers.27.mlp.experts.58.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.58.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.58.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.58.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.58.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.59.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.59.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.59.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.59.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.59.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.59.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.6.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.6.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.6.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.6.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.6.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.6.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.60.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.60.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.60.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.60.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.60.up_proj.weight": 
"model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.60.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.61.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.61.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.61.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.61.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.61.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.61.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.62.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.62.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.62.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.62.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.62.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.62.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.63.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.63.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.63.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.63.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.63.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.63.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.64.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.64.down_proj.weight_scale": "model-00028-of-00092.safetensors", + 
"model.layers.27.mlp.experts.64.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.64.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.64.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.64.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.65.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.65.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.65.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.65.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.65.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.65.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.66.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.66.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.66.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.66.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.66.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.66.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.67.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.67.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.67.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.67.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.67.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.67.up_proj.weight_scale": 
"model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.68.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.68.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.68.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.68.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.68.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.68.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.69.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.69.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.69.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.69.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.69.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.69.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.7.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.7.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.7.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.7.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.7.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.7.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.70.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.70.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.70.gate_proj.weight": "model-00028-of-00092.safetensors", + 
"model.layers.27.mlp.experts.70.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.70.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.70.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.71.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.71.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.71.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.71.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.71.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.71.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.72.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.72.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.72.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.72.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.72.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.72.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.73.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.73.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.73.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.73.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.73.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.73.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.74.down_proj.weight": 
"model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.74.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.74.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.74.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.74.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.74.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.75.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.75.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.75.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.75.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.75.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.75.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.76.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.76.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.76.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.76.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.76.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.76.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.77.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.77.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.77.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.77.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + 
"model.layers.27.mlp.experts.77.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.77.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.78.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.78.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.78.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.78.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.78.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.78.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.79.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.79.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.79.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.79.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.79.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.79.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.8.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.8.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.8.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.8.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.8.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.8.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.80.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.80.down_proj.weight_scale": "model-00028-of-00092.safetensors", 
+ "model.layers.27.mlp.experts.80.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.80.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.80.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.80.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.81.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.81.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.81.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.81.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.81.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.81.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.82.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.82.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.82.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.82.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.82.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.82.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.83.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.83.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.83.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.83.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.83.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.83.up_proj.weight_scale": 
"model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.84.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.84.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.84.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.84.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.84.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.84.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.85.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.85.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.85.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.85.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.85.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.85.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.86.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.86.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.86.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.86.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.86.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.86.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.87.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.87.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.87.gate_proj.weight": "model-00028-of-00092.safetensors", + 
"model.layers.27.mlp.experts.87.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.87.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.87.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.88.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.88.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.88.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.88.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.88.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.88.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.89.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.89.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.89.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.89.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.89.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.89.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.9.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.9.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.9.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.9.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.9.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.9.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.90.down_proj.weight": "model-00028-of-00092.safetensors", 
+ "model.layers.27.mlp.experts.90.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.90.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.90.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.90.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.90.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.91.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.91.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.91.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.91.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.91.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.91.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.92.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.92.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.92.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.92.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.92.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.92.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.93.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.93.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.93.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.93.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.93.up_proj.weight": 
"model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.93.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.94.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.94.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.94.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.94.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.94.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.94.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.95.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.95.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.95.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.95.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.95.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.95.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.96.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.96.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.96.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.96.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.96.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.96.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.97.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.97.down_proj.weight_scale": "model-00028-of-00092.safetensors", + 
"model.layers.27.mlp.experts.97.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.97.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.97.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.97.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.98.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.98.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.98.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.98.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.98.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.98.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.99.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.99.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.99.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.99.gate_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.99.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.experts.99.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.gate.e_score_correction_bias": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.gate.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.shared_experts.down_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.shared_experts.down_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.shared_experts.gate_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.shared_experts.gate_proj.weight_scale": 
"model-00028-of-00092.safetensors", + "model.layers.27.mlp.shared_experts.up_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.mlp.shared_experts.up_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.post_attention_layernorm.weight": "model-00028-of-00092.safetensors", + "model.layers.27.self_attn.k_norm.weight": "model-00028-of-00092.safetensors", + "model.layers.27.self_attn.k_proj.bias": "model-00028-of-00092.safetensors", + "model.layers.27.self_attn.k_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.self_attn.k_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.self_attn.o_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.self_attn.o_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.self_attn.q_norm.weight": "model-00028-of-00092.safetensors", + "model.layers.27.self_attn.q_proj.bias": "model-00028-of-00092.safetensors", + "model.layers.27.self_attn.q_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.self_attn.q_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.27.self_attn.v_proj.bias": "model-00028-of-00092.safetensors", + "model.layers.27.self_attn.v_proj.weight": "model-00028-of-00092.safetensors", + "model.layers.27.self_attn.v_proj.weight_scale": "model-00028-of-00092.safetensors", + "model.layers.28.input_layernorm.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.0.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.0.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.0.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.0.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.0.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.0.up_proj.weight_scale": 
"model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.1.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.1.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.1.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.1.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.1.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.1.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.10.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.10.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.10.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.10.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.10.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.10.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.100.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.100.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.100.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.100.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.100.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.100.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.101.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.101.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.101.gate_proj.weight": "model-00029-of-00092.safetensors", + 
"model.layers.28.mlp.experts.101.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.101.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.101.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.102.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.102.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.102.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.102.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.102.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.102.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.103.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.103.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.103.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.103.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.103.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.103.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.104.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.104.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.104.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.104.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.104.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.104.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.105.down_proj.weight": 
"model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.105.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.105.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.105.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.105.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.105.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.106.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.106.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.106.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.106.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.106.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.106.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.107.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.107.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.107.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.107.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.107.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.107.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.108.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.108.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.108.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.108.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + 
"model.layers.28.mlp.experts.108.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.108.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.109.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.109.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.109.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.109.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.109.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.109.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.11.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.11.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.11.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.11.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.11.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.11.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.110.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.110.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.110.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.110.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.110.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.110.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.111.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.111.down_proj.weight_scale": 
"model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.111.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.111.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.111.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.111.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.112.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.112.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.112.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.112.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.112.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.112.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.113.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.113.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.113.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.113.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.113.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.113.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.114.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.114.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.114.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.114.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.114.up_proj.weight": "model-00029-of-00092.safetensors", + 
"model.layers.28.mlp.experts.114.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.115.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.115.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.115.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.115.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.115.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.115.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.116.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.116.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.116.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.116.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.116.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.116.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.117.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.117.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.117.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.117.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.117.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.117.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.118.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.118.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.118.gate_proj.weight": 
"model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.118.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.118.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.118.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.119.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.119.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.119.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.119.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.119.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.119.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.12.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.12.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.12.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.12.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.12.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.12.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.120.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.120.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.120.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.120.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.120.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.120.up_proj.weight_scale": "model-00029-of-00092.safetensors", + 
"model.layers.28.mlp.experts.121.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.121.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.121.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.121.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.121.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.121.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.122.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.122.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.122.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.122.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.122.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.122.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.123.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.123.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.123.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.123.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.123.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.123.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.124.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.124.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.124.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.124.gate_proj.weight_scale": 
"model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.124.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.124.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.125.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.125.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.125.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.125.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.125.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.125.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.126.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.126.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.126.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.126.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.126.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.126.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.127.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.127.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.127.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.127.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.127.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.127.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.128.down_proj.weight": "model-00029-of-00092.safetensors", + 
"model.layers.28.mlp.experts.128.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.128.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.128.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.128.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.128.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.129.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.129.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.129.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.129.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.129.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.129.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.13.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.13.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.13.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.13.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.13.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.13.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.130.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.130.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.130.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.130.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.130.up_proj.weight": 
"model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.130.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.131.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.131.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.131.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.131.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.131.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.131.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.132.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.132.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.132.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.132.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.132.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.132.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.133.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.133.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.133.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.133.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.133.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.133.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.134.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.134.down_proj.weight_scale": "model-00029-of-00092.safetensors", + 
"model.layers.28.mlp.experts.134.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.134.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.134.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.134.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.135.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.135.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.135.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.135.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.135.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.135.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.136.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.136.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.136.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.136.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.136.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.136.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.137.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.137.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.137.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.137.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.137.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.137.up_proj.weight_scale": 
"model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.138.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.138.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.138.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.138.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.138.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.138.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.139.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.139.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.139.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.139.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.139.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.139.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.14.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.14.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.14.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.14.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.14.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.14.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.140.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.140.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.140.gate_proj.weight": "model-00029-of-00092.safetensors", + 
"model.layers.28.mlp.experts.140.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.140.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.140.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.141.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.141.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.141.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.141.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.141.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.141.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.142.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.142.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.142.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.142.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.142.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.142.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.143.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.143.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.143.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.143.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.143.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.143.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.144.down_proj.weight": 
"model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.144.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.144.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.144.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.144.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.144.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.145.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.145.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.145.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.145.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.145.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.145.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.146.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.146.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.146.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.146.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.146.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.146.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.147.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.147.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.147.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.147.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + 
"model.layers.28.mlp.experts.147.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.147.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.148.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.148.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.148.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.148.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.148.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.148.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.149.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.149.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.149.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.149.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.149.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.149.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.15.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.15.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.15.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.15.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.15.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.15.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.150.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.150.down_proj.weight_scale": 
"model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.150.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.150.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.150.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.150.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.151.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.151.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.151.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.151.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.151.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.151.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.152.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.152.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.152.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.152.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.152.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.152.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.153.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.153.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.153.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.153.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.153.up_proj.weight": "model-00029-of-00092.safetensors", + 
"model.layers.28.mlp.experts.153.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.154.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.154.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.154.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.154.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.154.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.154.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.155.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.155.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.155.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.155.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.155.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.155.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.156.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.156.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.156.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.156.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.156.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.156.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.157.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.157.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.157.gate_proj.weight": 
"model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.157.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.157.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.157.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.158.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.158.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.158.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.158.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.158.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.158.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.159.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.159.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.159.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.159.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.159.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.159.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.16.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.16.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.16.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.16.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.16.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.16.up_proj.weight_scale": "model-00029-of-00092.safetensors", + 
"model.layers.28.mlp.experts.17.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.17.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.17.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.17.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.17.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.17.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.18.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.18.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.18.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.18.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.18.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.18.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.19.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.19.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.19.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.19.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.19.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.19.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.2.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.2.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.2.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.2.gate_proj.weight_scale": 
"model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.2.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.2.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.20.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.20.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.20.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.20.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.20.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.20.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.21.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.21.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.21.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.21.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.21.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.21.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.22.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.22.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.22.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.22.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.22.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.22.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.23.down_proj.weight": "model-00029-of-00092.safetensors", + 
"model.layers.28.mlp.experts.23.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.23.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.23.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.23.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.23.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.24.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.24.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.24.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.24.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.24.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.24.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.25.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.25.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.25.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.25.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.25.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.25.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.26.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.26.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.26.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.26.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.26.up_proj.weight": 
"model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.26.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.27.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.27.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.27.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.27.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.27.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.27.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.28.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.28.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.28.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.28.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.28.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.28.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.29.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.29.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.29.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.29.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.29.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.29.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.3.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.3.down_proj.weight_scale": "model-00029-of-00092.safetensors", + 
"model.layers.28.mlp.experts.3.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.3.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.3.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.3.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.30.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.30.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.30.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.30.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.30.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.30.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.31.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.31.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.31.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.31.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.31.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.31.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.32.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.32.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.32.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.32.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.32.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.32.up_proj.weight_scale": 
"model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.33.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.33.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.33.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.33.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.33.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.33.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.34.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.34.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.34.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.34.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.34.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.34.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.35.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.35.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.35.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.35.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.35.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.35.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.36.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.36.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.36.gate_proj.weight": "model-00029-of-00092.safetensors", + 
"model.layers.28.mlp.experts.36.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.36.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.36.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.37.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.37.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.37.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.37.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.37.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.37.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.38.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.38.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.38.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.38.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.38.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.38.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.39.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.39.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.39.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.39.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.39.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.39.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.4.down_proj.weight": 
"model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.4.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.4.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.4.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.4.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.4.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.40.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.40.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.40.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.40.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.40.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.40.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.41.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.41.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.41.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.41.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.41.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.41.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.42.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.42.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.42.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.42.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + 
"model.layers.28.mlp.experts.42.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.42.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.43.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.43.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.43.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.43.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.43.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.43.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.44.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.44.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.44.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.44.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.44.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.44.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.45.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.45.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.45.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.45.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.45.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.45.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.46.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.46.down_proj.weight_scale": 
"model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.46.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.46.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.46.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.46.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.47.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.47.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.47.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.47.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.47.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.47.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.48.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.48.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.48.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.48.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.48.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.48.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.49.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.49.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.49.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.49.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.49.up_proj.weight": "model-00029-of-00092.safetensors", + 
"model.layers.28.mlp.experts.49.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.5.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.5.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.5.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.5.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.5.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.5.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.50.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.50.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.50.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.50.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.50.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.50.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.51.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.51.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.51.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.51.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.51.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.51.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.52.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.52.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.52.gate_proj.weight": 
"model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.52.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.52.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.52.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.53.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.53.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.53.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.53.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.53.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.53.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.54.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.54.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.54.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.54.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.54.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.54.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.55.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.55.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.55.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.55.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.55.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.55.up_proj.weight_scale": "model-00029-of-00092.safetensors", + 
"model.layers.28.mlp.experts.56.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.56.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.56.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.56.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.56.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.56.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.57.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.57.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.57.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.57.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.57.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.57.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.58.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.58.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.58.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.58.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.58.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.58.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.59.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.59.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.59.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.59.gate_proj.weight_scale": 
"model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.59.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.59.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.6.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.6.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.6.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.6.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.6.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.6.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.60.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.60.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.60.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.60.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.60.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.60.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.61.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.61.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.61.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.61.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.61.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.61.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.62.down_proj.weight": "model-00029-of-00092.safetensors", + 
"model.layers.28.mlp.experts.62.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.62.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.62.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.62.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.62.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.63.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.63.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.63.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.63.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.63.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.63.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.64.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.64.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.64.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.64.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.64.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.64.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.65.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.65.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.65.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.65.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.65.up_proj.weight": 
"model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.65.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.66.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.66.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.66.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.66.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.66.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.66.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.67.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.67.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.67.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.67.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.67.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.67.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.68.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.68.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.68.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.68.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.68.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.68.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.69.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.69.down_proj.weight_scale": "model-00029-of-00092.safetensors", + 
"model.layers.28.mlp.experts.69.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.69.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.69.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.69.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.7.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.7.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.7.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.7.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.7.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.7.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.70.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.70.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.70.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.70.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.70.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.70.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.71.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.71.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.71.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.71.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.71.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.71.up_proj.weight_scale": "model-00029-of-00092.safetensors", 
+ "model.layers.28.mlp.experts.72.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.72.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.72.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.72.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.72.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.72.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.73.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.73.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.73.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.73.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.73.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.73.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.74.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.74.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.74.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.74.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.74.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.74.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.75.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.75.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.75.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.75.gate_proj.weight_scale": 
"model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.75.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.75.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.76.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.76.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.76.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.76.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.76.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.76.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.77.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.77.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.77.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.77.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.77.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.77.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.78.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.78.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.78.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.78.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.78.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.78.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.79.down_proj.weight": "model-00029-of-00092.safetensors", + 
"model.layers.28.mlp.experts.79.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.79.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.79.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.79.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.79.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.8.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.8.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.8.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.8.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.8.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.8.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.80.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.80.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.80.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.80.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.80.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.80.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.81.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.81.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.81.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.81.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.81.up_proj.weight": 
"model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.81.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.82.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.82.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.82.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.82.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.82.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.82.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.83.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.83.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.83.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.83.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.83.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.83.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.84.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.84.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.84.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.84.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.84.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.84.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.85.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.85.down_proj.weight_scale": "model-00029-of-00092.safetensors", + 
"model.layers.28.mlp.experts.85.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.85.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.85.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.85.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.86.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.86.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.86.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.86.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.86.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.86.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.87.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.87.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.87.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.87.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.87.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.87.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.88.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.88.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.88.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.88.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.88.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.88.up_proj.weight_scale": 
"model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.89.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.89.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.89.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.89.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.89.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.89.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.9.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.9.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.9.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.9.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.9.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.9.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.90.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.90.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.90.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.90.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.90.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.90.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.91.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.91.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.91.gate_proj.weight": "model-00029-of-00092.safetensors", + 
"model.layers.28.mlp.experts.91.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.91.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.91.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.92.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.92.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.92.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.92.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.92.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.92.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.93.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.93.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.93.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.93.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.93.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.93.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.94.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.94.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.94.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.94.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.94.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.94.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.95.down_proj.weight": 
"model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.95.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.95.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.95.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.95.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.95.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.96.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.96.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.96.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.96.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.96.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.96.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.97.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.97.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.97.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.97.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.97.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.97.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.98.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.98.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.98.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.98.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + 
"model.layers.28.mlp.experts.98.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.98.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.99.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.99.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.99.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.99.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.99.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.experts.99.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.gate.e_score_correction_bias": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.gate.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.shared_experts.down_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.shared_experts.down_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.shared_experts.gate_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.shared_experts.gate_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.shared_experts.up_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.mlp.shared_experts.up_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.post_attention_layernorm.weight": "model-00029-of-00092.safetensors", + "model.layers.28.self_attn.k_norm.weight": "model-00029-of-00092.safetensors", + "model.layers.28.self_attn.k_proj.bias": "model-00029-of-00092.safetensors", + "model.layers.28.self_attn.k_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.self_attn.k_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.self_attn.o_proj.weight": "model-00029-of-00092.safetensors", + 
"model.layers.28.self_attn.o_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.self_attn.q_norm.weight": "model-00029-of-00092.safetensors", + "model.layers.28.self_attn.q_proj.bias": "model-00029-of-00092.safetensors", + "model.layers.28.self_attn.q_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.self_attn.q_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.28.self_attn.v_proj.bias": "model-00029-of-00092.safetensors", + "model.layers.28.self_attn.v_proj.weight": "model-00029-of-00092.safetensors", + "model.layers.28.self_attn.v_proj.weight_scale": "model-00029-of-00092.safetensors", + "model.layers.29.input_layernorm.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.0.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.0.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.0.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.0.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.0.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.0.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.1.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.1.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.1.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.1.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.1.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.1.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.10.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.10.down_proj.weight_scale": 
"model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.10.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.10.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.10.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.10.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.100.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.100.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.100.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.100.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.100.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.100.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.101.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.101.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.101.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.101.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.101.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.101.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.102.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.102.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.102.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.102.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.102.up_proj.weight": "model-00030-of-00092.safetensors", + 
"model.layers.29.mlp.experts.102.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.103.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.103.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.103.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.103.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.103.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.103.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.104.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.104.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.104.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.104.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.104.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.104.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.105.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.105.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.105.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.105.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.105.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.105.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.106.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.106.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.106.gate_proj.weight": 
"model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.106.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.106.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.106.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.107.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.107.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.107.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.107.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.107.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.107.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.108.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.108.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.108.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.108.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.108.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.108.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.109.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.109.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.109.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.109.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.109.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.109.up_proj.weight_scale": "model-00030-of-00092.safetensors", + 
"model.layers.29.mlp.experts.11.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.11.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.11.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.11.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.11.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.11.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.110.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.110.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.110.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.110.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.110.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.110.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.111.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.111.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.111.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.111.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.111.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.111.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.112.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.112.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.112.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.112.gate_proj.weight_scale": 
"model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.112.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.112.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.113.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.113.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.113.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.113.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.113.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.113.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.114.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.114.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.114.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.114.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.114.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.114.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.115.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.115.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.115.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.115.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.115.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.115.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.116.down_proj.weight": "model-00030-of-00092.safetensors", + 
"model.layers.29.mlp.experts.116.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.116.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.116.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.116.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.116.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.117.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.117.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.117.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.117.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.117.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.117.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.118.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.118.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.118.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.118.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.118.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.118.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.119.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.119.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.119.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.119.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.119.up_proj.weight": 
"model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.119.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.12.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.12.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.12.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.12.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.12.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.12.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.120.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.120.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.120.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.120.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.120.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.120.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.121.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.121.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.121.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.121.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.121.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.121.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.122.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.122.down_proj.weight_scale": "model-00030-of-00092.safetensors", + 
"model.layers.29.mlp.experts.122.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.122.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.122.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.122.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.123.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.123.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.123.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.123.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.123.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.123.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.124.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.124.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.124.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.124.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.124.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.124.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.125.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.125.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.125.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.125.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.125.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.125.up_proj.weight_scale": 
"model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.126.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.126.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.126.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.126.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.126.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.126.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.127.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.127.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.127.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.127.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.127.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.127.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.128.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.128.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.128.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.128.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.128.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.128.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.129.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.129.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.129.gate_proj.weight": "model-00030-of-00092.safetensors", + 
"model.layers.29.mlp.experts.129.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.129.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.129.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.13.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.13.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.13.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.13.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.13.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.13.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.130.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.130.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.130.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.130.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.130.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.130.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.131.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.131.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.131.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.131.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.131.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.131.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.132.down_proj.weight": 
"model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.132.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.132.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.132.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.132.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.132.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.133.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.133.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.133.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.133.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.133.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.133.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.134.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.134.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.134.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.134.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.134.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.134.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.135.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.135.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.135.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.135.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + 
"model.layers.29.mlp.experts.135.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.135.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.136.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.136.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.136.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.136.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.136.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.136.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.137.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.137.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.137.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.137.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.137.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.137.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.138.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.138.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.138.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.138.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.138.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.138.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.139.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.139.down_proj.weight_scale": 
"model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.139.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.139.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.139.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.139.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.14.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.14.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.14.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.14.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.14.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.14.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.140.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.140.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.140.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.140.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.140.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.140.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.141.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.141.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.141.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.141.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.141.up_proj.weight": "model-00030-of-00092.safetensors", + 
"model.layers.29.mlp.experts.141.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.142.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.142.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.142.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.142.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.142.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.142.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.143.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.143.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.143.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.143.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.143.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.143.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.144.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.144.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.144.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.144.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.144.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.144.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.145.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.145.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.145.gate_proj.weight": 
"model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.145.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.145.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.145.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.146.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.146.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.146.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.146.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.146.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.146.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.147.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.147.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.147.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.147.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.147.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.147.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.148.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.148.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.148.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.148.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.148.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.148.up_proj.weight_scale": "model-00030-of-00092.safetensors", + 
"model.layers.29.mlp.experts.149.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.149.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.149.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.149.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.149.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.149.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.15.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.15.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.15.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.15.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.15.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.15.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.150.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.150.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.150.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.150.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.150.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.150.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.151.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.151.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.151.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.151.gate_proj.weight_scale": 
"model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.151.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.151.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.152.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.152.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.152.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.152.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.152.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.152.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.153.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.153.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.153.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.153.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.153.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.153.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.154.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.154.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.154.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.154.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.154.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.154.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.155.down_proj.weight": "model-00030-of-00092.safetensors", + 
"model.layers.29.mlp.experts.155.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.155.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.155.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.155.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.155.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.156.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.156.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.156.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.156.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.156.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.156.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.157.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.157.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.157.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.157.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.157.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.157.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.158.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.158.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.158.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.158.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.158.up_proj.weight": 
"model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.158.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.159.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.159.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.159.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.159.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.159.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.159.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.16.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.16.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.16.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.16.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.16.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.16.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.17.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.17.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.17.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.17.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.17.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.17.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.18.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.18.down_proj.weight_scale": "model-00030-of-00092.safetensors", + 
"model.layers.29.mlp.experts.18.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.18.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.18.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.18.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.19.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.19.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.19.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.19.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.19.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.19.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.2.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.2.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.2.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.2.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.2.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.2.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.20.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.20.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.20.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.20.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.20.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.20.up_proj.weight_scale": "model-00030-of-00092.safetensors", 
+ "model.layers.29.mlp.experts.21.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.21.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.21.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.21.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.21.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.21.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.22.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.22.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.22.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.22.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.22.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.22.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.23.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.23.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.23.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.23.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.23.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.23.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.24.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.24.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.24.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.24.gate_proj.weight_scale": 
"model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.24.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.24.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.25.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.25.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.25.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.25.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.25.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.25.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.26.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.26.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.26.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.26.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.26.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.26.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.27.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.27.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.27.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.27.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.27.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.27.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.28.down_proj.weight": "model-00030-of-00092.safetensors", + 
"model.layers.29.mlp.experts.28.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.28.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.28.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.28.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.28.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.29.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.29.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.29.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.29.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.29.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.29.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.3.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.3.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.3.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.3.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.3.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.3.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.30.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.30.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.30.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.30.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.30.up_proj.weight": 
"model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.30.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.31.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.31.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.31.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.31.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.31.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.31.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.32.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.32.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.32.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.32.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.32.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.32.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.33.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.33.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.33.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.33.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.33.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.33.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.34.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.34.down_proj.weight_scale": "model-00030-of-00092.safetensors", + 
"model.layers.29.mlp.experts.34.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.34.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.34.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.34.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.35.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.35.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.35.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.35.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.35.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.35.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.36.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.36.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.36.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.36.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.36.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.36.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.37.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.37.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.37.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.37.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.37.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.37.up_proj.weight_scale": 
"model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.38.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.38.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.38.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.38.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.38.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.38.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.39.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.39.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.39.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.39.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.39.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.39.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.4.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.4.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.4.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.4.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.4.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.4.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.40.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.40.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.40.gate_proj.weight": "model-00030-of-00092.safetensors", + 
"model.layers.29.mlp.experts.40.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.40.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.40.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.41.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.41.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.41.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.41.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.41.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.41.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.42.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.42.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.42.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.42.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.42.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.42.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.43.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.43.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.43.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.43.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.43.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.43.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.44.down_proj.weight": 
"model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.44.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.44.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.44.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.44.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.44.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.45.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.45.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.45.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.45.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.45.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.45.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.46.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.46.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.46.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.46.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.46.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.46.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.47.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.47.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.47.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.47.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + 
"model.layers.29.mlp.experts.47.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.47.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.48.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.48.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.48.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.48.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.48.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.48.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.49.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.49.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.49.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.49.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.49.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.49.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.5.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.5.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.5.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.5.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.5.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.5.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.50.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.50.down_proj.weight_scale": "model-00030-of-00092.safetensors", 
+ "model.layers.29.mlp.experts.50.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.50.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.50.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.50.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.51.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.51.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.51.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.51.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.51.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.51.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.52.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.52.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.52.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.52.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.52.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.52.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.53.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.53.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.53.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.53.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.53.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.53.up_proj.weight_scale": 
"model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.54.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.54.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.54.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.54.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.54.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.54.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.55.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.55.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.55.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.55.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.55.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.55.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.56.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.56.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.56.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.56.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.56.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.56.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.57.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.57.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.57.gate_proj.weight": "model-00030-of-00092.safetensors", + 
"model.layers.29.mlp.experts.57.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.57.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.57.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.58.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.58.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.58.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.58.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.58.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.58.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.59.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.59.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.59.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.59.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.59.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.59.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.6.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.6.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.6.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.6.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.6.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.6.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.60.down_proj.weight": "model-00030-of-00092.safetensors", 
+ "model.layers.29.mlp.experts.60.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.60.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.60.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.60.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.60.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.61.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.61.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.61.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.61.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.61.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.61.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.62.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.62.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.62.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.62.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.62.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.62.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.63.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.63.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.63.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.63.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.63.up_proj.weight": 
"model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.63.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.64.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.64.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.64.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.64.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.64.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.64.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.65.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.65.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.65.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.65.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.65.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.65.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.66.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.66.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.66.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.66.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.66.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.66.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.67.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.67.down_proj.weight_scale": "model-00030-of-00092.safetensors", + 
"model.layers.29.mlp.experts.67.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.67.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.67.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.67.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.68.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.68.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.68.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.68.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.68.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.68.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.69.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.69.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.69.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.69.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.69.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.69.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.7.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.7.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.7.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.7.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.7.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.7.up_proj.weight_scale": "model-00030-of-00092.safetensors", 
+ "model.layers.29.mlp.experts.70.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.70.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.70.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.70.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.70.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.70.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.71.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.71.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.71.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.71.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.71.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.71.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.72.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.72.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.72.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.72.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.72.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.72.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.73.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.73.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.73.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.73.gate_proj.weight_scale": 
"model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.73.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.73.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.74.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.74.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.74.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.74.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.74.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.74.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.75.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.75.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.75.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.75.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.75.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.75.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.76.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.76.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.76.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.76.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.76.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.76.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.77.down_proj.weight": "model-00030-of-00092.safetensors", + 
"model.layers.29.mlp.experts.77.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.77.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.77.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.77.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.77.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.78.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.78.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.78.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.78.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.78.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.78.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.79.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.79.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.79.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.79.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.79.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.79.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.8.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.8.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.8.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.8.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.8.up_proj.weight": 
"model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.8.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.80.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.80.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.80.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.80.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.80.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.80.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.81.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.81.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.81.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.81.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.81.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.81.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.82.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.82.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.82.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.82.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.82.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.82.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.83.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.83.down_proj.weight_scale": "model-00030-of-00092.safetensors", + 
"model.layers.29.mlp.experts.83.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.83.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.83.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.83.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.84.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.84.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.84.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.84.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.84.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.84.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.85.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.85.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.85.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.85.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.85.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.85.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.86.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.86.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.86.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.86.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.86.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.86.up_proj.weight_scale": 
"model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.87.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.87.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.87.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.87.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.87.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.87.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.88.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.88.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.88.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.88.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.88.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.88.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.89.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.89.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.89.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.89.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.89.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.89.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.9.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.9.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.9.gate_proj.weight": "model-00030-of-00092.safetensors", + 
"model.layers.29.mlp.experts.9.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.9.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.9.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.90.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.90.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.90.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.90.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.90.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.90.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.91.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.91.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.91.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.91.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.91.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.91.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.92.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.92.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.92.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.92.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.92.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.92.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.93.down_proj.weight": 
"model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.93.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.93.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.93.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.93.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.93.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.94.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.94.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.94.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.94.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.94.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.94.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.95.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.95.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.95.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.95.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.95.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.95.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.96.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.96.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.96.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.96.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + 
"model.layers.29.mlp.experts.96.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.96.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.97.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.97.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.97.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.97.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.97.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.97.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.98.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.98.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.98.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.98.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.98.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.98.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.99.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.99.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.99.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.99.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.99.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.experts.99.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.gate.e_score_correction_bias": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.gate.weight": "model-00030-of-00092.safetensors", + 
"model.layers.29.mlp.shared_experts.down_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.shared_experts.down_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.shared_experts.gate_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.shared_experts.gate_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.shared_experts.up_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.mlp.shared_experts.up_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.post_attention_layernorm.weight": "model-00030-of-00092.safetensors", + "model.layers.29.self_attn.k_norm.weight": "model-00030-of-00092.safetensors", + "model.layers.29.self_attn.k_proj.bias": "model-00030-of-00092.safetensors", + "model.layers.29.self_attn.k_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.self_attn.k_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.self_attn.o_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.self_attn.o_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.self_attn.q_norm.weight": "model-00030-of-00092.safetensors", + "model.layers.29.self_attn.q_proj.bias": "model-00030-of-00092.safetensors", + "model.layers.29.self_attn.q_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.self_attn.q_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.29.self_attn.v_proj.bias": "model-00030-of-00092.safetensors", + "model.layers.29.self_attn.v_proj.weight": "model-00030-of-00092.safetensors", + "model.layers.29.self_attn.v_proj.weight_scale": "model-00030-of-00092.safetensors", + "model.layers.30.input_layernorm.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.0.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.0.down_proj.weight_scale": "model-00031-of-00092.safetensors", + 
"model.layers.30.mlp.experts.0.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.0.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.0.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.0.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.1.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.1.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.1.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.1.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.1.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.1.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.10.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.10.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.10.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.10.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.10.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.10.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.100.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.100.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.100.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.100.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.100.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.100.up_proj.weight_scale": 
"model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.101.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.101.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.101.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.101.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.101.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.101.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.102.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.102.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.102.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.102.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.102.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.102.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.103.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.103.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.103.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.103.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.103.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.103.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.104.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.104.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.104.gate_proj.weight": "model-00031-of-00092.safetensors", + 
"model.layers.30.mlp.experts.104.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.104.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.104.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.105.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.105.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.105.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.105.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.105.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.105.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.106.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.106.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.106.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.106.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.106.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.106.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.107.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.107.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.107.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.107.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.107.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.107.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.108.down_proj.weight": 
"model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.108.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.108.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.108.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.108.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.108.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.109.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.109.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.109.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.109.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.109.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.109.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.11.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.11.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.11.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.11.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.11.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.11.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.110.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.110.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.110.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.110.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + 
"model.layers.30.mlp.experts.110.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.110.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.111.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.111.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.111.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.111.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.111.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.111.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.112.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.112.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.112.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.112.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.112.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.112.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.113.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.113.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.113.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.113.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.113.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.113.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.114.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.114.down_proj.weight_scale": 
"model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.114.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.114.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.114.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.114.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.115.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.115.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.115.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.115.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.115.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.115.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.116.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.116.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.116.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.116.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.116.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.116.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.117.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.117.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.117.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.117.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.117.up_proj.weight": "model-00031-of-00092.safetensors", + 
"model.layers.30.mlp.experts.117.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.118.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.118.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.118.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.118.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.118.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.118.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.119.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.119.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.119.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.119.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.119.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.119.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.12.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.12.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.12.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.12.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.12.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.12.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.120.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.120.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.120.gate_proj.weight": 
"model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.120.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.120.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.120.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.121.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.121.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.121.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.121.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.121.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.121.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.122.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.122.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.122.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.122.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.122.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.122.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.123.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.123.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.123.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.123.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.123.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.123.up_proj.weight_scale": "model-00031-of-00092.safetensors", + 
"model.layers.30.mlp.experts.124.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.124.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.124.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.124.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.124.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.124.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.125.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.125.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.125.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.125.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.125.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.125.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.126.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.126.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.126.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.126.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.126.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.126.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.127.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.127.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.127.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.127.gate_proj.weight_scale": 
"model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.127.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.127.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.128.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.128.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.128.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.128.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.128.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.128.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.129.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.129.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.129.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.129.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.129.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.129.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.13.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.13.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.13.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.13.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.13.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.13.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.130.down_proj.weight": "model-00031-of-00092.safetensors", + 
"model.layers.30.mlp.experts.130.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.130.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.130.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.130.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.130.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.131.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.131.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.131.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.131.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.131.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.131.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.132.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.132.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.132.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.132.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.132.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.132.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.133.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.133.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.133.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.133.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.133.up_proj.weight": 
"model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.133.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.134.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.134.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.134.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.134.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.134.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.134.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.135.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.135.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.135.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.135.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.135.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.135.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.136.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.136.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.136.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.136.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.136.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.136.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.137.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.137.down_proj.weight_scale": "model-00031-of-00092.safetensors", + 
"model.layers.30.mlp.experts.137.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.137.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.137.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.137.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.138.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.138.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.138.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.138.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.138.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.138.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.139.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.139.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.139.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.139.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.139.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.139.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.14.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.14.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.14.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.14.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.14.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.14.up_proj.weight_scale": 
"model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.140.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.140.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.140.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.140.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.140.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.140.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.141.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.141.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.141.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.141.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.141.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.141.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.142.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.142.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.142.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.142.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.142.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.142.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.143.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.143.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.143.gate_proj.weight": "model-00031-of-00092.safetensors", + 
"model.layers.30.mlp.experts.143.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.143.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.143.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.144.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.144.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.144.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.144.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.144.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.144.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.145.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.145.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.145.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.145.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.145.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.145.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.146.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.146.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.146.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.146.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.146.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.146.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.147.down_proj.weight": 
"model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.147.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.147.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.147.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.147.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.147.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.148.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.148.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.148.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.148.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.148.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.148.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.149.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.149.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.149.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.149.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.149.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.149.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.15.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.15.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.15.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.15.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + 
"model.layers.30.mlp.experts.15.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.15.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.150.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.150.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.150.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.150.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.150.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.150.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.151.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.151.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.151.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.151.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.151.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.151.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.152.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.152.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.152.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.152.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.152.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.152.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.153.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.153.down_proj.weight_scale": 
"model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.153.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.153.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.153.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.153.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.154.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.154.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.154.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.154.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.154.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.154.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.155.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.155.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.155.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.155.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.155.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.155.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.156.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.156.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.156.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.156.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.156.up_proj.weight": "model-00031-of-00092.safetensors", + 
"model.layers.30.mlp.experts.156.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.157.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.157.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.157.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.157.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.157.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.157.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.158.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.158.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.158.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.158.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.158.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.158.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.159.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.159.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.159.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.159.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.159.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.159.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.16.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.16.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.16.gate_proj.weight": 
"model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.16.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.16.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.16.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.17.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.17.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.17.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.17.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.17.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.17.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.18.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.18.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.18.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.18.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.18.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.18.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.19.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.19.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.19.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.19.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.19.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.19.up_proj.weight_scale": "model-00031-of-00092.safetensors", + 
"model.layers.30.mlp.experts.2.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.2.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.2.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.2.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.2.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.2.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.20.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.20.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.20.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.20.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.20.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.20.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.21.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.21.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.21.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.21.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.21.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.21.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.22.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.22.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.22.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.22.gate_proj.weight_scale": 
"model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.22.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.22.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.23.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.23.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.23.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.23.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.23.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.23.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.24.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.24.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.24.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.24.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.24.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.24.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.25.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.25.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.25.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.25.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.25.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.25.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.26.down_proj.weight": "model-00031-of-00092.safetensors", + 
"model.layers.30.mlp.experts.26.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.26.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.26.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.26.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.26.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.27.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.27.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.27.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.27.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.27.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.27.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.28.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.28.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.28.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.28.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.28.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.28.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.29.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.29.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.29.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.29.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.29.up_proj.weight": 
"model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.29.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.3.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.3.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.3.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.3.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.3.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.3.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.30.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.30.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.30.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.30.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.30.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.30.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.31.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.31.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.31.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.31.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.31.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.31.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.32.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.32.down_proj.weight_scale": "model-00031-of-00092.safetensors", + 
"model.layers.30.mlp.experts.32.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.32.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.32.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.32.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.33.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.33.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.33.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.33.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.33.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.33.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.34.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.34.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.34.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.34.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.34.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.34.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.35.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.35.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.35.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.35.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.35.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.35.up_proj.weight_scale": 
"model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.36.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.36.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.36.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.36.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.36.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.36.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.37.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.37.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.37.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.37.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.37.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.37.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.38.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.38.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.38.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.38.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.38.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.38.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.39.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.39.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.39.gate_proj.weight": "model-00031-of-00092.safetensors", + 
"model.layers.30.mlp.experts.39.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.39.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.39.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.4.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.4.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.4.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.4.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.4.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.4.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.40.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.40.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.40.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.40.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.40.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.40.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.41.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.41.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.41.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.41.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.41.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.41.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.42.down_proj.weight": "model-00031-of-00092.safetensors", 
+ "model.layers.30.mlp.experts.42.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.42.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.42.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.42.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.42.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.43.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.43.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.43.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.43.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.43.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.43.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.44.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.44.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.44.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.44.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.44.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.44.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.45.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.45.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.45.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.45.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.45.up_proj.weight": 
"model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.45.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.46.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.46.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.46.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.46.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.46.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.46.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.47.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.47.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.47.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.47.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.47.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.47.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.48.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.48.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.48.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.48.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.48.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.48.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.49.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.49.down_proj.weight_scale": "model-00031-of-00092.safetensors", + 
"model.layers.30.mlp.experts.49.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.49.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.49.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.49.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.5.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.5.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.5.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.5.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.5.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.5.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.50.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.50.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.50.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.50.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.50.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.50.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.51.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.51.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.51.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.51.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.51.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.51.up_proj.weight_scale": "model-00031-of-00092.safetensors", 
+ "model.layers.30.mlp.experts.52.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.52.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.52.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.52.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.52.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.52.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.53.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.53.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.53.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.53.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.53.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.53.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.54.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.54.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.54.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.54.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.54.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.54.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.55.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.55.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.55.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.55.gate_proj.weight_scale": 
"model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.55.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.55.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.56.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.56.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.56.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.56.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.56.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.56.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.57.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.57.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.57.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.57.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.57.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.57.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.58.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.58.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.58.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.58.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.58.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.58.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.59.down_proj.weight": "model-00031-of-00092.safetensors", + 
"model.layers.30.mlp.experts.59.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.59.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.59.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.59.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.59.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.6.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.6.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.6.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.6.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.6.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.6.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.60.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.60.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.60.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.60.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.60.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.60.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.61.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.61.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.61.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.61.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.61.up_proj.weight": 
"model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.61.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.62.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.62.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.62.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.62.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.62.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.62.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.63.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.63.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.63.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.63.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.63.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.63.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.64.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.64.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.64.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.64.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.64.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.64.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.65.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.65.down_proj.weight_scale": "model-00031-of-00092.safetensors", + 
"model.layers.30.mlp.experts.65.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.65.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.65.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.65.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.66.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.66.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.66.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.66.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.66.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.66.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.67.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.67.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.67.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.67.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.67.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.67.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.68.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.68.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.68.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.68.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.68.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.68.up_proj.weight_scale": 
"model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.69.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.69.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.69.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.69.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.69.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.69.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.7.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.7.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.7.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.7.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.7.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.7.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.70.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.70.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.70.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.70.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.70.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.70.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.71.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.71.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.71.gate_proj.weight": "model-00031-of-00092.safetensors", + 
"model.layers.30.mlp.experts.71.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.71.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.71.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.72.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.72.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.72.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.72.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.72.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.72.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.73.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.73.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.73.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.73.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.73.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.73.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.74.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.74.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.74.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.74.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.74.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.74.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.75.down_proj.weight": 
"model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.75.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.75.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.75.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.75.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.75.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.76.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.76.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.76.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.76.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.76.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.76.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.77.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.77.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.77.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.77.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.77.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.77.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.78.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.78.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.78.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.78.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + 
"model.layers.30.mlp.experts.78.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.78.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.79.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.79.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.79.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.79.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.79.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.79.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.8.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.8.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.8.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.8.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.8.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.8.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.80.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.80.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.80.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.80.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.80.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.80.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.81.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.81.down_proj.weight_scale": "model-00031-of-00092.safetensors", 
+ "model.layers.30.mlp.experts.81.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.81.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.81.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.81.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.82.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.82.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.82.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.82.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.82.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.82.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.83.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.83.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.83.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.83.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.83.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.83.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.84.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.84.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.84.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.84.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.84.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.84.up_proj.weight_scale": 
"model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.85.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.85.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.85.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.85.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.85.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.85.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.86.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.86.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.86.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.86.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.86.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.86.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.87.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.87.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.87.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.87.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.87.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.87.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.88.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.88.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.88.gate_proj.weight": "model-00031-of-00092.safetensors", + 
"model.layers.30.mlp.experts.88.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.88.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.88.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.89.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.89.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.89.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.89.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.89.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.89.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.9.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.9.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.9.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.9.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.9.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.9.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.90.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.90.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.90.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.90.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.90.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.90.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.91.down_proj.weight": "model-00031-of-00092.safetensors", 
+ "model.layers.30.mlp.experts.91.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.91.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.91.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.91.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.91.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.92.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.92.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.92.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.92.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.92.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.92.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.93.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.93.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.93.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.93.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.93.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.93.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.94.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.94.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.94.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.94.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.94.up_proj.weight": 
"model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.94.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.95.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.95.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.95.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.95.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.95.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.95.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.96.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.96.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.96.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.96.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.96.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.96.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.97.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.97.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.97.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.97.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.97.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.97.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.98.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.98.down_proj.weight_scale": "model-00031-of-00092.safetensors", + 
"model.layers.30.mlp.experts.98.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.98.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.98.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.98.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.99.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.99.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.99.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.99.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.99.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.experts.99.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.gate.e_score_correction_bias": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.gate.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.shared_experts.down_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.shared_experts.down_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.shared_experts.gate_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.shared_experts.gate_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.shared_experts.up_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.mlp.shared_experts.up_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.post_attention_layernorm.weight": "model-00031-of-00092.safetensors", + "model.layers.30.self_attn.k_norm.weight": "model-00031-of-00092.safetensors", + "model.layers.30.self_attn.k_proj.bias": "model-00031-of-00092.safetensors", + "model.layers.30.self_attn.k_proj.weight": "model-00031-of-00092.safetensors", + 
"model.layers.30.self_attn.k_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.self_attn.o_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.self_attn.o_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.self_attn.q_norm.weight": "model-00031-of-00092.safetensors", + "model.layers.30.self_attn.q_proj.bias": "model-00031-of-00092.safetensors", + "model.layers.30.self_attn.q_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.self_attn.q_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.30.self_attn.v_proj.bias": "model-00031-of-00092.safetensors", + "model.layers.30.self_attn.v_proj.weight": "model-00031-of-00092.safetensors", + "model.layers.30.self_attn.v_proj.weight_scale": "model-00031-of-00092.safetensors", + "model.layers.31.input_layernorm.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.0.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.0.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.0.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.0.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.0.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.0.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.1.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.1.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.1.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.1.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.1.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.1.up_proj.weight_scale": "model-00032-of-00092.safetensors", + 
"model.layers.31.mlp.experts.10.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.10.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.10.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.10.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.10.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.10.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.100.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.100.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.100.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.100.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.100.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.100.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.101.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.101.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.101.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.101.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.101.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.101.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.102.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.102.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.102.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.102.gate_proj.weight_scale": 
"model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.102.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.102.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.103.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.103.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.103.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.103.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.103.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.103.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.104.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.104.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.104.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.104.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.104.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.104.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.105.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.105.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.105.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.105.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.105.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.105.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.106.down_proj.weight": "model-00032-of-00092.safetensors", + 
"model.layers.31.mlp.experts.106.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.106.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.106.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.106.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.106.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.107.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.107.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.107.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.107.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.107.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.107.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.108.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.108.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.108.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.108.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.108.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.108.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.109.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.109.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.109.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.109.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.109.up_proj.weight": 
"model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.109.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.11.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.11.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.11.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.11.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.11.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.11.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.110.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.110.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.110.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.110.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.110.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.110.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.111.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.111.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.111.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.111.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.111.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.111.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.112.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.112.down_proj.weight_scale": "model-00032-of-00092.safetensors", + 
"model.layers.31.mlp.experts.112.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.112.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.112.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.112.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.113.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.113.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.113.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.113.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.113.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.113.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.114.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.114.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.114.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.114.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.114.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.114.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.115.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.115.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.115.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.115.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.115.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.115.up_proj.weight_scale": 
"model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.116.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.116.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.116.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.116.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.116.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.116.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.117.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.117.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.117.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.117.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.117.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.117.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.118.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.118.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.118.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.118.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.118.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.118.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.119.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.119.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.119.gate_proj.weight": "model-00032-of-00092.safetensors", + 
"model.layers.31.mlp.experts.119.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.119.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.119.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.12.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.12.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.12.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.12.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.12.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.12.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.120.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.120.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.120.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.120.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.120.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.120.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.121.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.121.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.121.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.121.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.121.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.121.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.122.down_proj.weight": 
"model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.122.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.122.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.122.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.122.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.122.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.123.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.123.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.123.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.123.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.123.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.123.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.124.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.124.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.124.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.124.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.124.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.124.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.125.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.125.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.125.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.125.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + 
"model.layers.31.mlp.experts.125.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.125.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.126.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.126.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.126.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.126.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.126.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.126.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.127.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.127.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.127.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.127.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.127.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.127.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.128.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.128.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.128.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.128.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.128.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.128.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.129.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.129.down_proj.weight_scale": 
"model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.129.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.129.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.129.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.129.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.13.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.13.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.13.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.13.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.13.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.13.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.130.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.130.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.130.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.130.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.130.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.130.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.131.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.131.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.131.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.131.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.131.up_proj.weight": "model-00032-of-00092.safetensors", + 
"model.layers.31.mlp.experts.131.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.132.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.132.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.132.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.132.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.132.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.132.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.133.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.133.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.133.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.133.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.133.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.133.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.134.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.134.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.134.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.134.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.134.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.134.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.135.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.135.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.135.gate_proj.weight": 
"model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.135.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.135.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.135.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.136.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.136.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.136.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.136.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.136.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.136.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.137.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.137.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.137.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.137.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.137.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.137.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.138.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.138.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.138.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.138.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.138.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.138.up_proj.weight_scale": "model-00032-of-00092.safetensors", + 
"model.layers.31.mlp.experts.139.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.139.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.139.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.139.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.139.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.139.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.14.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.14.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.14.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.14.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.14.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.14.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.140.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.140.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.140.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.140.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.140.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.140.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.141.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.141.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.141.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.141.gate_proj.weight_scale": 
"model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.141.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.141.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.142.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.142.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.142.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.142.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.142.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.142.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.143.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.143.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.143.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.143.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.143.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.143.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.144.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.144.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.144.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.144.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.144.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.144.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.145.down_proj.weight": "model-00032-of-00092.safetensors", + 
"model.layers.31.mlp.experts.145.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.145.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.145.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.145.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.145.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.146.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.146.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.146.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.146.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.146.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.146.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.147.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.147.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.147.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.147.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.147.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.147.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.148.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.148.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.148.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.148.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.148.up_proj.weight": 
"model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.148.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.149.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.149.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.149.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.149.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.149.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.149.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.15.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.15.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.15.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.15.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.15.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.15.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.150.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.150.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.150.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.150.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.150.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.150.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.151.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.151.down_proj.weight_scale": "model-00032-of-00092.safetensors", + 
"model.layers.31.mlp.experts.151.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.151.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.151.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.151.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.152.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.152.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.152.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.152.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.152.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.152.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.153.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.153.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.153.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.153.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.153.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.153.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.154.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.154.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.154.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.154.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.154.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.154.up_proj.weight_scale": 
"model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.155.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.155.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.155.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.155.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.155.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.155.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.156.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.156.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.156.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.156.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.156.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.156.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.157.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.157.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.157.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.157.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.157.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.157.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.158.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.158.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.158.gate_proj.weight": "model-00032-of-00092.safetensors", + 
"model.layers.31.mlp.experts.158.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.158.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.158.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.159.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.159.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.159.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.159.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.159.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.159.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.16.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.16.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.16.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.16.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.16.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.16.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.17.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.17.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.17.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.17.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.17.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.17.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.18.down_proj.weight": 
"model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.18.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.18.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.18.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.18.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.18.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.19.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.19.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.19.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.19.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.19.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.19.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.2.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.2.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.2.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.2.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.2.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.2.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.20.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.20.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.20.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.20.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + 
"model.layers.31.mlp.experts.20.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.20.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.21.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.21.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.21.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.21.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.21.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.21.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.22.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.22.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.22.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.22.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.22.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.22.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.23.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.23.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.23.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.23.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.23.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.23.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.24.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.24.down_proj.weight_scale": 
"model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.24.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.24.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.24.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.24.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.25.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.25.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.25.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.25.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.25.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.25.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.26.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.26.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.26.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.26.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.26.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.26.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.27.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.27.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.27.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.27.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.27.up_proj.weight": "model-00032-of-00092.safetensors", + 
"model.layers.31.mlp.experts.27.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.28.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.28.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.28.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.28.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.28.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.28.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.29.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.29.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.29.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.29.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.29.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.29.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.3.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.3.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.3.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.3.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.3.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.3.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.30.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.30.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.30.gate_proj.weight": 
"model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.30.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.30.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.30.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.31.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.31.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.31.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.31.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.31.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.31.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.32.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.32.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.32.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.32.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.32.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.32.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.33.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.33.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.33.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.33.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.33.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.33.up_proj.weight_scale": "model-00032-of-00092.safetensors", + 
"model.layers.31.mlp.experts.34.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.34.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.34.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.34.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.34.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.34.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.35.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.35.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.35.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.35.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.35.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.35.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.36.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.36.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.36.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.36.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.36.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.36.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.37.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.37.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.37.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.37.gate_proj.weight_scale": 
"model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.37.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.37.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.38.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.38.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.38.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.38.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.38.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.38.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.39.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.39.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.39.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.39.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.39.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.39.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.4.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.4.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.4.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.4.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.4.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.4.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.40.down_proj.weight": "model-00032-of-00092.safetensors", + 
"model.layers.31.mlp.experts.40.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.40.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.40.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.40.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.40.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.41.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.41.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.41.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.41.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.41.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.41.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.42.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.42.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.42.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.42.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.42.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.42.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.43.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.43.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.43.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.43.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.43.up_proj.weight": 
"model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.43.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.44.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.44.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.44.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.44.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.44.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.44.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.45.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.45.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.45.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.45.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.45.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.45.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.46.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.46.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.46.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.46.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.46.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.46.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.47.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.47.down_proj.weight_scale": "model-00032-of-00092.safetensors", + 
"model.layers.31.mlp.experts.47.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.47.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.47.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.47.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.48.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.48.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.48.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.48.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.48.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.48.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.49.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.49.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.49.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.49.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.49.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.49.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.5.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.5.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.5.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.5.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.5.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.5.up_proj.weight_scale": "model-00032-of-00092.safetensors", 
+ "model.layers.31.mlp.experts.50.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.50.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.50.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.50.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.50.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.50.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.51.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.51.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.51.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.51.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.51.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.51.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.52.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.52.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.52.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.52.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.52.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.52.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.53.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.53.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.53.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.53.gate_proj.weight_scale": 
"model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.53.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.53.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.54.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.54.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.54.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.54.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.54.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.54.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.55.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.55.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.55.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.55.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.55.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.55.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.56.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.56.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.56.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.56.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.56.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.56.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.57.down_proj.weight": "model-00032-of-00092.safetensors", + 
"model.layers.31.mlp.experts.57.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.57.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.57.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.57.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.57.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.58.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.58.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.58.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.58.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.58.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.58.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.59.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.59.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.59.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.59.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.59.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.59.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.6.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.6.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.6.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.6.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.6.up_proj.weight": 
"model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.6.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.60.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.60.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.60.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.60.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.60.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.60.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.61.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.61.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.61.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.61.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.61.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.61.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.62.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.62.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.62.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.62.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.62.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.62.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.63.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.63.down_proj.weight_scale": "model-00032-of-00092.safetensors", + 
"model.layers.31.mlp.experts.63.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.63.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.63.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.63.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.64.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.64.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.64.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.64.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.64.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.64.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.65.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.65.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.65.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.65.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.65.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.65.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.66.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.66.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.66.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.66.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.66.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.66.up_proj.weight_scale": 
"model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.67.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.67.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.67.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.67.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.67.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.67.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.68.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.68.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.68.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.68.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.68.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.68.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.69.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.69.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.69.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.69.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.69.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.69.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.7.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.7.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.7.gate_proj.weight": "model-00032-of-00092.safetensors", + 
"model.layers.31.mlp.experts.7.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.7.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.7.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.70.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.70.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.70.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.70.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.70.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.70.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.71.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.71.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.71.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.71.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.71.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.71.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.72.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.72.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.72.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.72.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.72.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.72.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.73.down_proj.weight": 
"model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.73.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.73.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.73.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.73.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.73.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.74.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.74.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.74.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.74.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.74.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.74.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.75.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.75.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.75.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.75.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.75.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.75.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.76.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.76.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.76.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.76.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + 
"model.layers.31.mlp.experts.76.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.76.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.77.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.77.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.77.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.77.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.77.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.77.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.78.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.78.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.78.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.78.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.78.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.78.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.79.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.79.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.79.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.79.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.79.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.79.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.8.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.8.down_proj.weight_scale": 
"model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.8.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.8.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.8.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.8.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.80.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.80.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.80.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.80.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.80.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.80.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.81.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.81.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.81.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.81.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.81.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.81.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.82.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.82.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.82.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.82.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.82.up_proj.weight": "model-00032-of-00092.safetensors", + 
"model.layers.31.mlp.experts.82.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.83.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.83.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.83.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.83.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.83.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.83.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.84.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.84.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.84.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.84.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.84.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.84.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.85.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.85.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.85.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.85.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.85.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.85.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.86.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.86.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.86.gate_proj.weight": 
"model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.86.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.86.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.86.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.87.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.87.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.87.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.87.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.87.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.87.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.88.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.88.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.88.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.88.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.88.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.88.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.89.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.89.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.89.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.89.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.89.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.89.up_proj.weight_scale": "model-00032-of-00092.safetensors", + 
"model.layers.31.mlp.experts.9.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.9.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.9.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.9.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.9.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.9.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.90.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.90.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.90.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.90.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.90.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.90.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.91.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.91.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.91.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.91.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.91.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.91.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.92.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.92.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.92.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.92.gate_proj.weight_scale": 
"model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.92.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.92.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.93.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.93.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.93.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.93.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.93.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.93.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.94.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.94.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.94.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.94.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.94.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.94.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.95.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.95.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.95.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.95.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.95.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.95.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.96.down_proj.weight": "model-00032-of-00092.safetensors", + 
"model.layers.31.mlp.experts.96.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.96.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.96.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.96.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.96.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.97.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.97.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.97.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.97.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.97.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.97.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.98.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.98.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.98.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.98.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.98.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.98.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.99.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.99.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.99.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.99.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.99.up_proj.weight": 
"model-00032-of-00092.safetensors", + "model.layers.31.mlp.experts.99.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.gate.e_score_correction_bias": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.gate.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.shared_experts.down_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.shared_experts.down_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.shared_experts.gate_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.shared_experts.gate_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.shared_experts.up_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.mlp.shared_experts.up_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.post_attention_layernorm.weight": "model-00032-of-00092.safetensors", + "model.layers.31.self_attn.k_norm.weight": "model-00032-of-00092.safetensors", + "model.layers.31.self_attn.k_proj.bias": "model-00032-of-00092.safetensors", + "model.layers.31.self_attn.k_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.self_attn.k_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.self_attn.o_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.self_attn.o_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.self_attn.q_norm.weight": "model-00032-of-00092.safetensors", + "model.layers.31.self_attn.q_proj.bias": "model-00032-of-00092.safetensors", + "model.layers.31.self_attn.q_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.self_attn.q_proj.weight_scale": "model-00032-of-00092.safetensors", + "model.layers.31.self_attn.v_proj.bias": "model-00032-of-00092.safetensors", + "model.layers.31.self_attn.v_proj.weight": "model-00032-of-00092.safetensors", + "model.layers.31.self_attn.v_proj.weight_scale": 
"model-00032-of-00092.safetensors", + "model.layers.32.input_layernorm.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.0.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.0.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.0.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.0.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.0.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.0.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.1.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.1.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.1.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.1.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.1.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.1.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.10.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.10.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.10.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.10.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.10.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.10.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.100.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.100.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.100.gate_proj.weight": 
"model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.100.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.100.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.100.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.101.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.101.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.101.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.101.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.101.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.101.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.102.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.102.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.102.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.102.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.102.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.102.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.103.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.103.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.103.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.103.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.103.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.103.up_proj.weight_scale": "model-00033-of-00092.safetensors", + 
"model.layers.32.mlp.experts.104.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.104.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.104.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.104.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.104.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.104.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.105.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.105.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.105.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.105.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.105.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.105.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.106.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.106.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.106.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.106.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.106.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.106.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.107.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.107.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.107.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.107.gate_proj.weight_scale": 
"model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.107.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.107.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.108.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.108.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.108.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.108.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.108.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.108.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.109.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.109.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.109.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.109.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.109.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.109.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.11.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.11.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.11.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.11.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.11.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.11.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.110.down_proj.weight": "model-00033-of-00092.safetensors", + 
"model.layers.32.mlp.experts.110.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.110.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.110.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.110.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.110.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.111.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.111.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.111.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.111.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.111.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.111.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.112.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.112.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.112.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.112.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.112.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.112.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.113.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.113.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.113.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.113.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.113.up_proj.weight": 
"model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.113.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.114.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.114.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.114.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.114.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.114.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.114.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.115.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.115.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.115.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.115.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.115.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.115.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.116.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.116.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.116.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.116.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.116.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.116.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.117.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.117.down_proj.weight_scale": "model-00033-of-00092.safetensors", + 
"model.layers.32.mlp.experts.117.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.117.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.117.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.117.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.118.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.118.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.118.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.118.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.118.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.118.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.119.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.119.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.119.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.119.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.119.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.119.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.12.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.12.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.12.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.12.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.12.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.12.up_proj.weight_scale": 
"model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.120.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.120.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.120.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.120.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.120.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.120.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.121.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.121.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.121.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.121.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.121.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.121.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.122.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.122.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.122.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.122.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.122.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.122.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.123.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.123.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.123.gate_proj.weight": "model-00033-of-00092.safetensors", + 
"model.layers.32.mlp.experts.123.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.123.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.123.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.124.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.124.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.124.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.124.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.124.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.124.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.125.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.125.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.125.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.125.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.125.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.125.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.126.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.126.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.126.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.126.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.126.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.126.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.127.down_proj.weight": 
"model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.127.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.127.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.127.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.127.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.127.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.128.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.128.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.128.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.128.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.128.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.128.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.129.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.129.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.129.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.129.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.129.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.129.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.13.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.13.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.13.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.13.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + 
"model.layers.32.mlp.experts.13.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.13.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.130.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.130.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.130.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.130.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.130.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.130.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.131.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.131.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.131.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.131.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.131.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.131.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.132.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.132.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.132.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.132.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.132.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.132.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.133.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.133.down_proj.weight_scale": 
"model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.133.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.133.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.133.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.133.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.134.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.134.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.134.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.134.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.134.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.134.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.135.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.135.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.135.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.135.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.135.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.135.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.136.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.136.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.136.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.136.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.136.up_proj.weight": "model-00033-of-00092.safetensors", + 
"model.layers.32.mlp.experts.136.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.137.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.137.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.137.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.137.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.137.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.137.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.138.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.138.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.138.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.138.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.138.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.138.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.139.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.139.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.139.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.139.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.139.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.139.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.14.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.14.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.14.gate_proj.weight": 
"model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.14.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.14.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.14.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.140.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.140.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.140.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.140.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.140.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.140.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.141.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.141.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.141.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.141.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.141.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.141.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.142.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.142.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.142.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.142.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.142.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.142.up_proj.weight_scale": "model-00033-of-00092.safetensors", + 
"model.layers.32.mlp.experts.143.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.143.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.143.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.143.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.143.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.143.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.144.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.144.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.144.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.144.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.144.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.144.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.145.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.145.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.145.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.145.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.145.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.145.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.146.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.146.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.146.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.146.gate_proj.weight_scale": 
"model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.146.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.146.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.147.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.147.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.147.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.147.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.147.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.147.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.148.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.148.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.148.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.148.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.148.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.148.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.149.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.149.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.149.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.149.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.149.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.149.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.15.down_proj.weight": "model-00033-of-00092.safetensors", + 
"model.layers.32.mlp.experts.15.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.15.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.15.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.15.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.15.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.150.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.150.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.150.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.150.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.150.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.150.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.151.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.151.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.151.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.151.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.151.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.151.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.152.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.152.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.152.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.152.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.152.up_proj.weight": 
"model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.152.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.153.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.153.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.153.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.153.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.153.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.153.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.154.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.154.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.154.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.154.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.154.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.154.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.155.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.155.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.155.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.155.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.155.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.155.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.156.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.156.down_proj.weight_scale": "model-00033-of-00092.safetensors", + 
"model.layers.32.mlp.experts.156.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.156.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.156.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.156.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.157.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.157.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.157.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.157.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.157.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.157.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.158.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.158.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.158.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.158.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.158.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.158.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.159.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.159.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.159.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.159.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.159.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.159.up_proj.weight_scale": 
"model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.16.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.16.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.16.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.16.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.16.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.16.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.17.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.17.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.17.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.17.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.17.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.17.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.18.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.18.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.18.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.18.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.18.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.18.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.19.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.19.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.19.gate_proj.weight": "model-00033-of-00092.safetensors", + 
"model.layers.32.mlp.experts.19.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.19.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.19.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.2.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.2.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.2.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.2.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.2.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.2.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.20.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.20.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.20.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.20.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.20.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.20.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.21.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.21.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.21.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.21.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.21.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.21.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.22.down_proj.weight": "model-00033-of-00092.safetensors", 
+ "model.layers.32.mlp.experts.22.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.22.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.22.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.22.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.22.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.23.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.23.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.23.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.23.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.23.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.23.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.24.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.24.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.24.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.24.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.24.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.24.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.25.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.25.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.25.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.25.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.25.up_proj.weight": 
"model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.25.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.26.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.26.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.26.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.26.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.26.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.26.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.27.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.27.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.27.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.27.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.27.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.27.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.28.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.28.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.28.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.28.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.28.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.28.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.29.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.29.down_proj.weight_scale": "model-00033-of-00092.safetensors", + 
"model.layers.32.mlp.experts.29.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.29.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.29.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.29.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.3.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.3.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.3.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.3.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.3.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.3.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.30.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.30.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.30.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.30.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.30.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.30.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.31.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.31.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.31.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.31.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.31.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.31.up_proj.weight_scale": "model-00033-of-00092.safetensors", 
+ "model.layers.32.mlp.experts.32.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.32.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.32.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.32.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.32.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.32.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.33.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.33.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.33.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.33.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.33.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.33.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.34.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.34.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.34.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.34.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.34.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.34.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.35.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.35.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.35.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.35.gate_proj.weight_scale": 
"model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.35.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.35.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.36.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.36.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.36.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.36.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.36.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.36.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.37.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.37.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.37.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.37.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.37.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.37.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.38.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.38.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.38.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.38.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.38.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.38.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.39.down_proj.weight": "model-00033-of-00092.safetensors", + 
"model.layers.32.mlp.experts.39.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.39.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.39.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.39.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.39.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.4.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.4.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.4.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.4.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.4.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.4.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.40.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.40.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.40.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.40.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.40.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.40.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.41.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.41.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.41.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.41.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.41.up_proj.weight": 
"model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.41.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.42.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.42.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.42.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.42.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.42.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.42.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.43.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.43.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.43.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.43.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.43.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.43.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.44.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.44.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.44.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.44.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.44.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.44.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.45.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.45.down_proj.weight_scale": "model-00033-of-00092.safetensors", + 
"model.layers.32.mlp.experts.45.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.45.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.45.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.45.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.46.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.46.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.46.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.46.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.46.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.46.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.47.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.47.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.47.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.47.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.47.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.47.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.48.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.48.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.48.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.48.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.48.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.48.up_proj.weight_scale": 
"model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.49.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.49.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.49.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.49.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.49.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.49.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.5.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.5.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.5.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.5.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.5.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.5.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.50.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.50.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.50.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.50.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.50.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.50.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.51.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.51.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.51.gate_proj.weight": "model-00033-of-00092.safetensors", + 
"model.layers.32.mlp.experts.51.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.51.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.51.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.52.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.52.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.52.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.52.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.52.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.52.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.53.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.53.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.53.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.53.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.53.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.53.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.54.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.54.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.54.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.54.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.54.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.54.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.55.down_proj.weight": 
"model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.55.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.55.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.55.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.55.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.55.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.56.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.56.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.56.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.56.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.56.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.56.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.57.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.57.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.57.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.57.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.57.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.57.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.58.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.58.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.58.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.58.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + 
"model.layers.32.mlp.experts.58.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.58.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.59.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.59.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.59.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.59.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.59.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.59.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.6.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.6.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.6.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.6.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.6.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.6.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.60.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.60.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.60.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.60.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.60.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.60.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.61.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.61.down_proj.weight_scale": "model-00033-of-00092.safetensors", 
+ "model.layers.32.mlp.experts.61.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.61.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.61.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.61.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.62.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.62.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.62.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.62.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.62.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.62.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.63.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.63.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.63.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.63.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.63.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.63.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.64.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.64.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.64.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.64.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.64.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.64.up_proj.weight_scale": 
"model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.65.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.65.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.65.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.65.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.65.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.65.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.66.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.66.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.66.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.66.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.66.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.66.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.67.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.67.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.67.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.67.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.67.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.67.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.68.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.68.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.68.gate_proj.weight": "model-00033-of-00092.safetensors", + 
"model.layers.32.mlp.experts.68.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.68.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.68.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.69.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.69.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.69.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.69.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.69.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.69.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.7.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.7.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.7.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.7.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.7.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.7.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.70.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.70.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.70.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.70.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.70.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.70.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.71.down_proj.weight": "model-00033-of-00092.safetensors", 
+ "model.layers.32.mlp.experts.71.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.71.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.71.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.71.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.71.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.72.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.72.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.72.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.72.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.72.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.72.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.73.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.73.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.73.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.73.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.73.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.73.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.74.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.74.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.74.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.74.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.74.up_proj.weight": 
"model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.74.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.75.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.75.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.75.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.75.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.75.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.75.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.76.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.76.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.76.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.76.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.76.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.76.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.77.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.77.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.77.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.77.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.77.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.77.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.78.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.78.down_proj.weight_scale": "model-00033-of-00092.safetensors", + 
"model.layers.32.mlp.experts.78.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.78.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.78.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.78.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.79.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.79.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.79.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.79.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.79.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.79.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.8.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.8.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.8.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.8.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.8.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.8.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.80.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.80.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.80.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.80.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.80.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.80.up_proj.weight_scale": "model-00033-of-00092.safetensors", 
+ "model.layers.32.mlp.experts.81.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.81.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.81.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.81.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.81.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.81.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.82.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.82.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.82.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.82.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.82.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.82.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.83.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.83.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.83.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.83.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.83.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.83.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.84.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.84.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.84.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.84.gate_proj.weight_scale": 
"model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.84.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.84.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.85.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.85.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.85.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.85.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.85.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.85.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.86.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.86.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.86.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.86.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.86.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.86.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.87.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.87.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.87.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.87.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.87.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.87.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.88.down_proj.weight": "model-00033-of-00092.safetensors", + 
"model.layers.32.mlp.experts.88.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.88.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.88.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.88.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.88.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.89.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.89.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.89.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.89.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.89.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.89.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.9.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.9.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.9.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.9.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.9.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.9.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.90.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.90.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.90.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.90.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.90.up_proj.weight": 
"model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.90.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.91.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.91.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.91.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.91.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.91.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.91.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.92.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.92.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.92.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.92.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.92.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.92.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.93.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.93.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.93.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.93.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.93.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.93.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.94.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.94.down_proj.weight_scale": "model-00033-of-00092.safetensors", + 
"model.layers.32.mlp.experts.94.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.94.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.94.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.94.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.95.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.95.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.95.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.95.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.95.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.95.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.96.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.96.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.96.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.96.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.96.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.96.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.97.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.97.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.97.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.97.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.97.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.97.up_proj.weight_scale": 
"model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.98.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.98.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.98.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.98.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.98.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.98.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.99.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.99.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.99.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.99.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.99.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.experts.99.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.gate.e_score_correction_bias": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.gate.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.shared_experts.down_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.shared_experts.down_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.shared_experts.gate_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.shared_experts.gate_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.shared_experts.up_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.mlp.shared_experts.up_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.post_attention_layernorm.weight": "model-00033-of-00092.safetensors", + 
"model.layers.32.self_attn.k_norm.weight": "model-00033-of-00092.safetensors", + "model.layers.32.self_attn.k_proj.bias": "model-00033-of-00092.safetensors", + "model.layers.32.self_attn.k_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.self_attn.k_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.self_attn.o_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.self_attn.o_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.self_attn.q_norm.weight": "model-00033-of-00092.safetensors", + "model.layers.32.self_attn.q_proj.bias": "model-00033-of-00092.safetensors", + "model.layers.32.self_attn.q_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.self_attn.q_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.32.self_attn.v_proj.bias": "model-00033-of-00092.safetensors", + "model.layers.32.self_attn.v_proj.weight": "model-00033-of-00092.safetensors", + "model.layers.32.self_attn.v_proj.weight_scale": "model-00033-of-00092.safetensors", + "model.layers.33.input_layernorm.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.0.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.0.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.0.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.0.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.0.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.0.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.1.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.1.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.1.gate_proj.weight": "model-00034-of-00092.safetensors", + 
"model.layers.33.mlp.experts.1.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.1.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.1.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.10.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.10.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.10.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.10.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.10.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.10.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.100.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.100.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.100.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.100.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.100.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.100.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.101.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.101.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.101.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.101.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.101.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.101.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.102.down_proj.weight": 
"model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.102.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.102.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.102.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.102.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.102.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.103.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.103.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.103.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.103.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.103.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.103.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.104.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.104.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.104.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.104.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.104.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.104.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.105.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.105.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.105.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.105.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + 
"model.layers.33.mlp.experts.105.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.105.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.106.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.106.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.106.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.106.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.106.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.106.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.107.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.107.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.107.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.107.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.107.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.107.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.108.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.108.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.108.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.108.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.108.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.108.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.109.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.109.down_proj.weight_scale": 
"model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.109.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.109.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.109.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.109.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.11.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.11.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.11.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.11.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.11.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.11.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.110.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.110.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.110.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.110.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.110.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.110.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.111.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.111.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.111.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.111.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.111.up_proj.weight": "model-00034-of-00092.safetensors", + 
"model.layers.33.mlp.experts.111.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.112.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.112.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.112.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.112.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.112.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.112.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.113.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.113.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.113.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.113.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.113.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.113.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.114.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.114.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.114.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.114.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.114.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.114.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.115.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.115.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.115.gate_proj.weight": 
"model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.115.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.115.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.115.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.116.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.116.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.116.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.116.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.116.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.116.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.117.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.117.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.117.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.117.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.117.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.117.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.118.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.118.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.118.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.118.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.118.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.118.up_proj.weight_scale": "model-00034-of-00092.safetensors", + 
"model.layers.33.mlp.experts.119.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.119.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.119.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.119.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.119.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.119.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.12.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.12.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.12.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.12.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.12.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.12.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.120.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.120.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.120.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.120.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.120.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.120.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.121.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.121.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.121.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.121.gate_proj.weight_scale": 
"model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.121.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.121.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.122.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.122.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.122.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.122.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.122.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.122.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.123.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.123.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.123.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.123.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.123.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.123.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.124.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.124.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.124.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.124.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.124.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.124.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.125.down_proj.weight": "model-00034-of-00092.safetensors", + 
"model.layers.33.mlp.experts.125.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.125.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.125.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.125.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.125.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.126.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.126.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.126.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.126.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.126.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.126.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.127.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.127.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.127.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.127.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.127.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.127.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.128.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.128.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.128.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.128.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.128.up_proj.weight": 
"model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.128.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.129.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.129.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.129.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.129.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.129.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.129.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.13.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.13.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.13.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.13.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.13.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.13.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.130.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.130.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.130.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.130.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.130.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.130.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.131.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.131.down_proj.weight_scale": "model-00034-of-00092.safetensors", + 
"model.layers.33.mlp.experts.131.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.131.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.131.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.131.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.132.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.132.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.132.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.132.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.132.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.132.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.133.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.133.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.133.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.133.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.133.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.133.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.134.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.134.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.134.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.134.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.134.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.134.up_proj.weight_scale": 
"model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.135.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.135.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.135.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.135.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.135.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.135.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.136.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.136.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.136.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.136.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.136.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.136.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.137.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.137.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.137.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.137.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.137.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.137.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.138.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.138.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.138.gate_proj.weight": "model-00034-of-00092.safetensors", + 
"model.layers.33.mlp.experts.138.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.138.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.138.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.139.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.139.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.139.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.139.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.139.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.139.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.14.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.14.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.14.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.14.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.14.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.14.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.140.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.140.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.140.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.140.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.140.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.140.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.141.down_proj.weight": 
"model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.141.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.141.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.141.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.141.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.141.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.142.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.142.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.142.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.142.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.142.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.142.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.143.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.143.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.143.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.143.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.143.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.143.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.144.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.144.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.144.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.144.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + 
"model.layers.33.mlp.experts.144.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.144.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.145.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.145.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.145.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.145.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.145.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.145.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.146.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.146.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.146.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.146.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.146.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.146.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.147.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.147.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.147.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.147.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.147.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.147.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.148.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.148.down_proj.weight_scale": 
"model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.148.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.148.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.148.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.148.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.149.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.149.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.149.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.149.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.149.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.149.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.15.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.15.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.15.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.15.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.15.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.15.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.150.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.150.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.150.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.150.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.150.up_proj.weight": "model-00034-of-00092.safetensors", + 
"model.layers.33.mlp.experts.150.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.151.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.151.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.151.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.151.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.151.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.151.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.152.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.152.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.152.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.152.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.152.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.152.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.153.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.153.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.153.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.153.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.153.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.153.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.154.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.154.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.154.gate_proj.weight": 
"model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.154.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.154.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.154.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.155.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.155.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.155.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.155.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.155.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.155.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.156.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.156.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.156.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.156.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.156.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.156.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.157.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.157.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.157.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.157.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.157.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.157.up_proj.weight_scale": "model-00034-of-00092.safetensors", + 
"model.layers.33.mlp.experts.158.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.158.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.158.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.158.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.158.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.158.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.159.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.159.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.159.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.159.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.159.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.159.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.16.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.16.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.16.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.16.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.16.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.16.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.17.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.17.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.17.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.17.gate_proj.weight_scale": 
"model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.17.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.17.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.18.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.18.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.18.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.18.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.18.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.18.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.19.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.19.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.19.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.19.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.19.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.19.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.2.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.2.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.2.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.2.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.2.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.2.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.20.down_proj.weight": "model-00034-of-00092.safetensors", + 
"model.layers.33.mlp.experts.20.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.20.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.20.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.20.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.20.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.21.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.21.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.21.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.21.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.21.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.21.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.22.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.22.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.22.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.22.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.22.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.22.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.23.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.23.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.23.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.23.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.23.up_proj.weight": 
"model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.23.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.24.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.24.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.24.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.24.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.24.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.24.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.25.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.25.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.25.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.25.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.25.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.25.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.26.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.26.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.26.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.26.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.26.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.26.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.27.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.27.down_proj.weight_scale": "model-00034-of-00092.safetensors", + 
"model.layers.33.mlp.experts.27.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.27.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.27.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.27.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.28.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.28.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.28.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.28.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.28.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.28.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.29.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.29.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.29.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.29.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.29.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.29.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.3.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.3.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.3.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.3.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.3.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.3.up_proj.weight_scale": "model-00034-of-00092.safetensors", 
+ "model.layers.33.mlp.experts.30.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.30.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.30.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.30.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.30.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.30.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.31.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.31.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.31.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.31.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.31.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.31.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.32.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.32.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.32.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.32.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.32.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.32.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.33.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.33.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.33.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.33.gate_proj.weight_scale": 
"model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.33.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.33.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.34.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.34.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.34.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.34.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.34.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.34.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.35.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.35.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.35.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.35.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.35.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.35.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.36.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.36.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.36.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.36.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.36.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.36.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.37.down_proj.weight": "model-00034-of-00092.safetensors", + 
"model.layers.33.mlp.experts.37.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.37.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.37.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.37.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.37.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.38.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.38.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.38.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.38.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.38.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.38.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.39.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.39.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.39.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.39.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.39.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.39.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.4.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.4.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.4.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.4.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.4.up_proj.weight": 
"model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.4.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.40.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.40.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.40.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.40.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.40.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.40.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.41.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.41.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.41.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.41.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.41.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.41.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.42.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.42.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.42.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.42.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.42.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.42.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.43.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.43.down_proj.weight_scale": "model-00034-of-00092.safetensors", + 
"model.layers.33.mlp.experts.43.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.43.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.43.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.43.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.44.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.44.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.44.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.44.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.44.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.44.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.45.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.45.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.45.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.45.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.45.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.45.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.46.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.46.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.46.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.46.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.46.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.46.up_proj.weight_scale": 
"model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.47.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.47.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.47.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.47.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.47.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.47.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.48.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.48.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.48.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.48.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.48.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.48.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.49.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.49.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.49.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.49.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.49.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.49.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.5.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.5.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.5.gate_proj.weight": "model-00034-of-00092.safetensors", + 
"model.layers.33.mlp.experts.5.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.5.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.5.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.50.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.50.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.50.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.50.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.50.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.50.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.51.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.51.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.51.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.51.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.51.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.51.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.52.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.52.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.52.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.52.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.52.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.52.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.53.down_proj.weight": 
"model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.53.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.53.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.53.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.53.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.53.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.54.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.54.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.54.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.54.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.54.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.54.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.55.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.55.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.55.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.55.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.55.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.55.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.56.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.56.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.56.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.56.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + 
"model.layers.33.mlp.experts.56.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.56.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.57.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.57.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.57.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.57.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.57.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.57.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.58.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.58.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.58.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.58.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.58.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.58.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.59.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.59.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.59.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.59.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.59.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.59.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.6.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.6.down_proj.weight_scale": 
"model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.6.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.6.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.6.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.6.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.60.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.60.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.60.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.60.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.60.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.60.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.61.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.61.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.61.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.61.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.61.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.61.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.62.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.62.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.62.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.62.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.62.up_proj.weight": "model-00034-of-00092.safetensors", + 
"model.layers.33.mlp.experts.62.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.63.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.63.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.63.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.63.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.63.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.63.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.64.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.64.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.64.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.64.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.64.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.64.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.65.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.65.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.65.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.65.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.65.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.65.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.66.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.66.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.66.gate_proj.weight": 
"model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.66.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.66.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.66.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.67.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.67.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.67.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.67.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.67.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.67.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.68.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.68.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.68.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.68.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.68.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.68.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.69.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.69.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.69.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.69.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.69.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.69.up_proj.weight_scale": "model-00034-of-00092.safetensors", + 
"model.layers.33.mlp.experts.7.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.7.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.7.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.7.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.7.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.7.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.70.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.70.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.70.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.70.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.70.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.70.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.71.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.71.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.71.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.71.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.71.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.71.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.72.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.72.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.72.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.72.gate_proj.weight_scale": 
"model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.72.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.72.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.73.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.73.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.73.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.73.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.73.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.73.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.74.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.74.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.74.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.74.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.74.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.74.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.75.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.75.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.75.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.75.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.75.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.75.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.76.down_proj.weight": "model-00034-of-00092.safetensors", + 
"model.layers.33.mlp.experts.76.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.76.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.76.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.76.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.76.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.77.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.77.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.77.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.77.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.77.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.77.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.78.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.78.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.78.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.78.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.78.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.78.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.79.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.79.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.79.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.79.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.79.up_proj.weight": 
"model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.79.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.8.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.8.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.8.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.8.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.8.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.8.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.80.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.80.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.80.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.80.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.80.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.80.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.81.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.81.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.81.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.81.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.81.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.81.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.82.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.82.down_proj.weight_scale": "model-00034-of-00092.safetensors", + 
"model.layers.33.mlp.experts.82.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.82.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.82.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.82.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.83.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.83.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.83.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.83.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.83.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.83.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.84.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.84.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.84.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.84.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.84.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.84.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.85.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.85.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.85.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.85.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.85.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.85.up_proj.weight_scale": 
"model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.86.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.86.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.86.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.86.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.86.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.86.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.87.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.87.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.87.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.87.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.87.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.87.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.88.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.88.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.88.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.88.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.88.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.88.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.89.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.89.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.89.gate_proj.weight": "model-00034-of-00092.safetensors", + 
"model.layers.33.mlp.experts.89.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.89.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.89.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.9.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.9.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.9.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.9.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.9.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.9.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.90.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.90.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.90.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.90.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.90.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.90.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.91.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.91.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.91.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.91.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.91.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.91.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.92.down_proj.weight": "model-00034-of-00092.safetensors", 
+ "model.layers.33.mlp.experts.92.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.92.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.92.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.92.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.92.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.93.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.93.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.93.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.93.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.93.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.93.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.94.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.94.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.94.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.94.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.94.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.94.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.95.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.95.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.95.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.95.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.95.up_proj.weight": 
"model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.95.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.96.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.96.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.96.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.96.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.96.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.96.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.97.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.97.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.97.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.97.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.97.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.97.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.98.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.98.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.98.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.98.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.98.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.98.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.99.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.99.down_proj.weight_scale": "model-00034-of-00092.safetensors", + 
"model.layers.33.mlp.experts.99.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.99.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.99.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.experts.99.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.gate.e_score_correction_bias": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.gate.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.shared_experts.down_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.shared_experts.down_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.shared_experts.gate_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.shared_experts.gate_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.shared_experts.up_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.mlp.shared_experts.up_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.post_attention_layernorm.weight": "model-00034-of-00092.safetensors", + "model.layers.33.self_attn.k_norm.weight": "model-00034-of-00092.safetensors", + "model.layers.33.self_attn.k_proj.bias": "model-00034-of-00092.safetensors", + "model.layers.33.self_attn.k_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.self_attn.k_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.self_attn.o_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.self_attn.o_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.33.self_attn.q_norm.weight": "model-00034-of-00092.safetensors", + "model.layers.33.self_attn.q_proj.bias": "model-00034-of-00092.safetensors", + "model.layers.33.self_attn.q_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.self_attn.q_proj.weight_scale": 
"model-00034-of-00092.safetensors", + "model.layers.33.self_attn.v_proj.bias": "model-00034-of-00092.safetensors", + "model.layers.33.self_attn.v_proj.weight": "model-00034-of-00092.safetensors", + "model.layers.33.self_attn.v_proj.weight_scale": "model-00034-of-00092.safetensors", + "model.layers.34.input_layernorm.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.0.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.0.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.0.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.0.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.0.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.0.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.1.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.1.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.1.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.1.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.1.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.1.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.10.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.10.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.10.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.10.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.10.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.10.up_proj.weight_scale": "model-00035-of-00092.safetensors", + 
"model.layers.34.mlp.experts.100.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.100.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.100.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.100.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.100.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.100.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.101.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.101.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.101.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.101.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.101.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.101.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.102.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.102.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.102.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.102.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.102.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.102.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.103.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.103.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.103.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.103.gate_proj.weight_scale": 
"model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.103.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.103.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.104.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.104.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.104.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.104.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.104.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.104.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.105.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.105.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.105.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.105.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.105.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.105.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.106.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.106.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.106.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.106.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.106.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.106.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.107.down_proj.weight": "model-00035-of-00092.safetensors", + 
"model.layers.34.mlp.experts.107.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.107.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.107.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.107.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.107.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.108.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.108.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.108.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.108.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.108.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.108.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.109.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.109.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.109.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.109.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.109.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.109.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.11.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.11.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.11.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.11.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.11.up_proj.weight": 
"model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.11.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.110.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.110.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.110.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.110.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.110.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.110.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.111.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.111.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.111.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.111.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.111.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.111.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.112.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.112.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.112.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.112.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.112.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.112.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.113.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.113.down_proj.weight_scale": "model-00035-of-00092.safetensors", + 
"model.layers.34.mlp.experts.113.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.113.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.113.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.113.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.114.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.114.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.114.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.114.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.114.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.114.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.115.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.115.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.115.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.115.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.115.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.115.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.116.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.116.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.116.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.116.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.116.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.116.up_proj.weight_scale": 
"model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.117.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.117.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.117.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.117.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.117.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.117.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.118.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.118.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.118.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.118.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.118.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.118.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.119.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.119.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.119.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.119.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.119.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.119.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.12.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.12.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.12.gate_proj.weight": "model-00035-of-00092.safetensors", + 
"model.layers.34.mlp.experts.12.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.12.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.12.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.120.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.120.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.120.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.120.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.120.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.120.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.121.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.121.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.121.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.121.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.121.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.121.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.122.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.122.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.122.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.122.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.122.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.122.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.123.down_proj.weight": 
"model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.123.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.123.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.123.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.123.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.123.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.124.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.124.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.124.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.124.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.124.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.124.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.125.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.125.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.125.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.125.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.125.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.125.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.126.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.126.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.126.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.126.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + 
"model.layers.34.mlp.experts.126.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.126.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.127.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.127.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.127.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.127.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.127.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.127.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.128.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.128.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.128.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.128.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.128.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.128.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.129.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.129.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.129.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.129.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.129.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.129.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.13.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.13.down_proj.weight_scale": 
"model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.13.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.13.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.13.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.13.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.130.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.130.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.130.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.130.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.130.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.130.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.131.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.131.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.131.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.131.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.131.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.131.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.132.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.132.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.132.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.132.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.132.up_proj.weight": "model-00035-of-00092.safetensors", + 
"model.layers.34.mlp.experts.132.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.133.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.133.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.133.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.133.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.133.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.133.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.134.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.134.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.134.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.134.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.134.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.134.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.135.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.135.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.135.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.135.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.135.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.135.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.136.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.136.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.136.gate_proj.weight": 
"model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.136.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.136.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.136.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.137.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.137.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.137.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.137.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.137.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.137.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.138.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.138.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.138.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.138.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.138.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.138.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.139.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.139.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.139.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.139.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.139.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.139.up_proj.weight_scale": "model-00035-of-00092.safetensors", + 
"model.layers.34.mlp.experts.14.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.14.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.14.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.14.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.14.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.14.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.140.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.140.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.140.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.140.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.140.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.140.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.141.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.141.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.141.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.141.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.141.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.141.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.142.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.142.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.142.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.142.gate_proj.weight_scale": 
"model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.142.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.142.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.143.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.143.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.143.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.143.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.143.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.143.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.144.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.144.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.144.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.144.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.144.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.144.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.145.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.145.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.145.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.145.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.145.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.145.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.146.down_proj.weight": "model-00035-of-00092.safetensors", + 
"model.layers.34.mlp.experts.146.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.146.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.146.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.146.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.146.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.147.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.147.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.147.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.147.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.147.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.147.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.148.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.148.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.148.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.148.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.148.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.148.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.149.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.149.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.149.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.149.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.149.up_proj.weight": 
"model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.149.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.15.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.15.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.15.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.15.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.15.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.15.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.150.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.150.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.150.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.150.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.150.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.150.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.151.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.151.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.151.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.151.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.151.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.151.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.152.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.152.down_proj.weight_scale": "model-00035-of-00092.safetensors", + 
"model.layers.34.mlp.experts.152.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.152.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.152.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.152.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.153.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.153.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.153.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.153.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.153.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.153.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.154.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.154.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.154.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.154.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.154.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.154.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.155.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.155.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.155.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.155.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.155.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.155.up_proj.weight_scale": 
"model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.156.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.156.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.156.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.156.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.156.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.156.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.157.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.157.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.157.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.157.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.157.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.157.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.158.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.158.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.158.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.158.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.158.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.158.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.159.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.159.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.159.gate_proj.weight": "model-00035-of-00092.safetensors", + 
"model.layers.34.mlp.experts.159.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.159.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.159.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.16.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.16.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.16.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.16.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.16.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.16.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.17.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.17.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.17.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.17.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.17.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.17.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.18.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.18.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.18.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.18.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.18.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.18.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.19.down_proj.weight": 
"model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.19.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.19.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.19.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.19.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.19.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.2.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.2.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.2.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.2.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.2.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.2.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.20.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.20.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.20.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.20.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.20.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.20.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.21.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.21.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.21.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.21.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + 
"model.layers.34.mlp.experts.21.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.21.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.22.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.22.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.22.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.22.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.22.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.22.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.23.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.23.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.23.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.23.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.23.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.23.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.24.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.24.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.24.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.24.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.24.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.24.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.25.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.25.down_proj.weight_scale": 
"model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.25.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.25.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.25.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.25.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.26.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.26.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.26.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.26.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.26.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.26.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.27.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.27.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.27.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.27.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.27.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.27.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.28.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.28.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.28.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.28.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.28.up_proj.weight": "model-00035-of-00092.safetensors", + 
"model.layers.34.mlp.experts.28.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.29.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.29.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.29.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.29.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.29.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.29.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.3.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.3.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.3.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.3.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.3.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.3.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.30.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.30.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.30.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.30.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.30.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.30.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.31.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.31.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.31.gate_proj.weight": 
"model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.31.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.31.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.31.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.32.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.32.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.32.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.32.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.32.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.32.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.33.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.33.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.33.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.33.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.33.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.33.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.34.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.34.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.34.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.34.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.34.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.34.up_proj.weight_scale": "model-00035-of-00092.safetensors", + 
"model.layers.34.mlp.experts.35.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.35.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.35.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.35.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.35.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.35.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.36.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.36.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.36.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.36.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.36.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.36.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.37.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.37.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.37.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.37.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.37.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.37.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.38.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.38.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.38.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.38.gate_proj.weight_scale": 
"model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.38.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.38.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.39.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.39.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.39.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.39.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.39.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.39.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.4.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.4.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.4.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.4.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.4.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.4.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.40.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.40.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.40.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.40.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.40.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.40.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.41.down_proj.weight": "model-00035-of-00092.safetensors", + 
"model.layers.34.mlp.experts.41.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.41.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.41.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.41.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.41.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.42.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.42.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.42.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.42.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.42.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.42.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.43.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.43.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.43.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.43.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.43.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.43.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.44.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.44.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.44.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.44.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.44.up_proj.weight": 
"model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.44.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.45.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.45.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.45.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.45.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.45.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.45.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.46.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.46.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.46.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.46.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.46.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.46.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.47.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.47.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.47.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.47.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.47.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.47.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.48.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.48.down_proj.weight_scale": "model-00035-of-00092.safetensors", + 
"model.layers.34.mlp.experts.48.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.48.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.48.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.48.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.49.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.49.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.49.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.49.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.49.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.49.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.5.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.5.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.5.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.5.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.5.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.5.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.50.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.50.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.50.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.50.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.50.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.50.up_proj.weight_scale": "model-00035-of-00092.safetensors", 
+ "model.layers.34.mlp.experts.51.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.51.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.51.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.51.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.51.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.51.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.52.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.52.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.52.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.52.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.52.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.52.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.53.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.53.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.53.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.53.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.53.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.53.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.54.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.54.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.54.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.54.gate_proj.weight_scale": 
"model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.54.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.54.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.55.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.55.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.55.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.55.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.55.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.55.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.56.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.56.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.56.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.56.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.56.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.56.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.57.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.57.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.57.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.57.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.57.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.57.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.58.down_proj.weight": "model-00035-of-00092.safetensors", + 
"model.layers.34.mlp.experts.58.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.58.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.58.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.58.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.58.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.59.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.59.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.59.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.59.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.59.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.59.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.6.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.6.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.6.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.6.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.6.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.6.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.60.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.60.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.60.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.60.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.60.up_proj.weight": 
"model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.60.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.61.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.61.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.61.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.61.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.61.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.61.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.62.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.62.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.62.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.62.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.62.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.62.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.63.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.63.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.63.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.63.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.63.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.63.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.64.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.64.down_proj.weight_scale": "model-00035-of-00092.safetensors", + 
"model.layers.34.mlp.experts.64.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.64.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.64.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.64.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.65.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.65.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.65.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.65.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.65.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.65.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.66.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.66.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.66.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.66.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.66.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.66.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.67.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.67.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.67.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.67.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.67.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.67.up_proj.weight_scale": 
"model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.68.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.68.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.68.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.68.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.68.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.68.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.69.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.69.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.69.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.69.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.69.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.69.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.7.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.7.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.7.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.7.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.7.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.7.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.70.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.70.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.70.gate_proj.weight": "model-00035-of-00092.safetensors", + 
"model.layers.34.mlp.experts.70.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.70.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.70.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.71.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.71.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.71.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.71.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.71.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.71.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.72.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.72.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.72.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.72.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.72.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.72.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.73.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.73.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.73.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.73.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.73.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.73.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.74.down_proj.weight": 
"model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.74.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.74.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.74.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.74.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.74.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.75.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.75.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.75.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.75.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.75.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.75.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.76.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.76.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.76.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.76.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.76.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.76.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.77.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.77.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.77.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.77.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + 
"model.layers.34.mlp.experts.77.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.77.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.78.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.78.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.78.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.78.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.78.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.78.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.79.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.79.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.79.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.79.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.79.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.79.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.8.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.8.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.8.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.8.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.8.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.8.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.80.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.80.down_proj.weight_scale": "model-00035-of-00092.safetensors", 
+ "model.layers.34.mlp.experts.80.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.80.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.80.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.80.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.81.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.81.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.81.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.81.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.81.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.81.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.82.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.82.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.82.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.82.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.82.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.82.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.83.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.83.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.83.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.83.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.83.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.83.up_proj.weight_scale": 
"model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.84.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.84.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.84.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.84.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.84.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.84.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.85.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.85.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.85.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.85.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.85.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.85.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.86.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.86.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.86.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.86.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.86.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.86.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.87.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.87.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.87.gate_proj.weight": "model-00035-of-00092.safetensors", + 
"model.layers.34.mlp.experts.87.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.87.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.87.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.88.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.88.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.88.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.88.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.88.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.88.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.89.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.89.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.89.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.89.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.89.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.89.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.9.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.9.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.9.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.9.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.9.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.9.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.90.down_proj.weight": "model-00035-of-00092.safetensors", 
+ "model.layers.34.mlp.experts.90.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.90.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.90.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.90.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.90.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.91.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.91.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.91.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.91.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.91.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.91.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.92.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.92.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.92.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.92.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.92.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.92.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.93.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.93.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.93.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.93.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.93.up_proj.weight": 
"model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.93.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.94.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.94.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.94.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.94.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.94.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.94.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.95.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.95.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.95.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.95.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.95.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.95.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.96.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.96.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.96.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.96.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.96.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.96.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.97.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.97.down_proj.weight_scale": "model-00035-of-00092.safetensors", + 
"model.layers.34.mlp.experts.97.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.97.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.97.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.97.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.98.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.98.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.98.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.98.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.98.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.98.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.99.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.99.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.99.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.99.gate_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.99.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.experts.99.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.gate.e_score_correction_bias": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.gate.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.shared_experts.down_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.shared_experts.down_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.shared_experts.gate_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.shared_experts.gate_proj.weight_scale": 
"model-00035-of-00092.safetensors", + "model.layers.34.mlp.shared_experts.up_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.mlp.shared_experts.up_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.post_attention_layernorm.weight": "model-00035-of-00092.safetensors", + "model.layers.34.self_attn.k_norm.weight": "model-00035-of-00092.safetensors", + "model.layers.34.self_attn.k_proj.bias": "model-00035-of-00092.safetensors", + "model.layers.34.self_attn.k_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.self_attn.k_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.self_attn.o_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.self_attn.o_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.self_attn.q_norm.weight": "model-00035-of-00092.safetensors", + "model.layers.34.self_attn.q_proj.bias": "model-00035-of-00092.safetensors", + "model.layers.34.self_attn.q_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.self_attn.q_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.34.self_attn.v_proj.bias": "model-00035-of-00092.safetensors", + "model.layers.34.self_attn.v_proj.weight": "model-00035-of-00092.safetensors", + "model.layers.34.self_attn.v_proj.weight_scale": "model-00035-of-00092.safetensors", + "model.layers.35.input_layernorm.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.0.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.0.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.0.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.0.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.0.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.0.up_proj.weight_scale": 
"model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.1.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.1.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.1.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.1.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.1.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.1.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.10.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.10.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.10.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.10.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.10.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.10.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.100.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.100.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.100.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.100.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.100.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.100.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.101.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.101.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.101.gate_proj.weight": "model-00036-of-00092.safetensors", + 
"model.layers.35.mlp.experts.101.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.101.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.101.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.102.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.102.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.102.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.102.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.102.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.102.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.103.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.103.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.103.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.103.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.103.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.103.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.104.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.104.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.104.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.104.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.104.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.104.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.105.down_proj.weight": 
"model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.105.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.105.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.105.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.105.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.105.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.106.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.106.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.106.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.106.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.106.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.106.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.107.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.107.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.107.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.107.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.107.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.107.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.108.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.108.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.108.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.108.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + 
"model.layers.35.mlp.experts.108.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.108.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.109.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.109.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.109.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.109.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.109.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.109.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.11.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.11.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.11.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.11.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.11.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.11.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.110.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.110.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.110.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.110.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.110.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.110.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.111.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.111.down_proj.weight_scale": 
"model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.111.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.111.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.111.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.111.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.112.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.112.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.112.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.112.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.112.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.112.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.113.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.113.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.113.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.113.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.113.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.113.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.114.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.114.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.114.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.114.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.114.up_proj.weight": "model-00036-of-00092.safetensors", + 
"model.layers.35.mlp.experts.114.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.115.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.115.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.115.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.115.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.115.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.115.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.116.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.116.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.116.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.116.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.116.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.116.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.117.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.117.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.117.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.117.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.117.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.117.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.118.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.118.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.118.gate_proj.weight": 
"model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.118.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.118.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.118.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.119.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.119.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.119.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.119.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.119.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.119.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.12.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.12.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.12.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.12.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.12.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.12.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.120.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.120.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.120.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.120.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.120.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.120.up_proj.weight_scale": "model-00036-of-00092.safetensors", + 
"model.layers.35.mlp.experts.121.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.121.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.121.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.121.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.121.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.121.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.122.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.122.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.122.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.122.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.122.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.122.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.123.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.123.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.123.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.123.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.123.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.123.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.124.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.124.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.124.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.124.gate_proj.weight_scale": 
"model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.124.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.124.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.125.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.125.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.125.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.125.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.125.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.125.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.126.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.126.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.126.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.126.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.126.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.126.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.127.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.127.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.127.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.127.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.127.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.127.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.128.down_proj.weight": "model-00036-of-00092.safetensors", + 
"model.layers.35.mlp.experts.128.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.128.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.128.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.128.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.128.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.129.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.129.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.129.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.129.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.129.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.129.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.13.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.13.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.13.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.13.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.13.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.13.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.130.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.130.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.130.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.130.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.130.up_proj.weight": 
"model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.130.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.131.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.131.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.131.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.131.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.131.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.131.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.132.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.132.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.132.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.132.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.132.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.132.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.133.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.133.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.133.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.133.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.133.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.133.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.134.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.134.down_proj.weight_scale": "model-00036-of-00092.safetensors", + 
"model.layers.35.mlp.experts.134.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.134.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.134.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.134.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.135.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.135.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.135.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.135.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.135.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.135.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.136.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.136.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.136.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.136.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.136.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.136.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.137.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.137.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.137.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.137.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.137.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.137.up_proj.weight_scale": 
"model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.138.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.138.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.138.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.138.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.138.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.138.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.139.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.139.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.139.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.139.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.139.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.139.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.14.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.14.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.14.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.14.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.14.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.14.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.140.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.140.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.140.gate_proj.weight": "model-00036-of-00092.safetensors", + 
"model.layers.35.mlp.experts.140.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.140.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.140.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.141.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.141.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.141.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.141.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.141.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.141.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.142.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.142.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.142.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.142.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.142.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.142.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.143.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.143.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.143.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.143.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.143.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.143.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.144.down_proj.weight": 
"model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.144.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.144.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.144.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.144.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.144.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.145.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.145.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.145.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.145.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.145.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.145.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.146.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.146.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.146.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.146.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.146.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.146.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.147.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.147.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.147.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.147.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + 
"model.layers.35.mlp.experts.147.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.147.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.148.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.148.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.148.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.148.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.148.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.148.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.149.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.149.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.149.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.149.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.149.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.149.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.15.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.15.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.15.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.15.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.15.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.15.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.150.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.150.down_proj.weight_scale": 
"model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.150.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.150.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.150.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.150.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.151.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.151.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.151.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.151.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.151.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.151.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.152.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.152.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.152.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.152.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.152.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.152.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.153.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.153.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.153.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.153.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.153.up_proj.weight": "model-00036-of-00092.safetensors", + 
"model.layers.35.mlp.experts.153.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.154.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.154.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.154.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.154.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.154.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.154.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.155.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.155.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.155.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.155.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.155.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.155.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.156.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.156.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.156.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.156.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.156.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.156.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.157.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.157.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.157.gate_proj.weight": 
"model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.157.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.157.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.157.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.158.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.158.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.158.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.158.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.158.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.158.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.159.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.159.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.159.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.159.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.159.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.159.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.16.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.16.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.16.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.16.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.16.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.16.up_proj.weight_scale": "model-00036-of-00092.safetensors", + 
"model.layers.35.mlp.experts.17.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.17.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.17.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.17.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.17.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.17.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.18.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.18.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.18.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.18.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.18.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.18.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.19.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.19.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.19.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.19.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.19.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.19.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.2.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.2.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.2.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.2.gate_proj.weight_scale": 
"model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.2.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.2.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.20.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.20.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.20.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.20.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.20.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.20.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.21.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.21.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.21.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.21.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.21.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.21.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.22.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.22.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.22.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.22.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.22.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.22.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.23.down_proj.weight": "model-00036-of-00092.safetensors", + 
"model.layers.35.mlp.experts.23.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.23.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.23.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.23.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.23.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.24.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.24.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.24.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.24.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.24.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.24.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.25.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.25.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.25.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.25.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.25.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.25.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.26.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.26.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.26.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.26.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.26.up_proj.weight": 
"model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.26.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.27.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.27.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.27.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.27.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.27.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.27.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.28.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.28.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.28.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.28.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.28.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.28.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.29.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.29.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.29.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.29.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.29.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.29.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.3.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.3.down_proj.weight_scale": "model-00036-of-00092.safetensors", + 
"model.layers.35.mlp.experts.3.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.3.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.3.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.3.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.30.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.30.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.30.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.30.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.30.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.30.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.31.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.31.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.31.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.31.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.31.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.31.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.32.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.32.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.32.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.32.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.32.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.32.up_proj.weight_scale": 
"model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.33.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.33.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.33.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.33.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.33.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.33.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.34.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.34.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.34.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.34.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.34.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.34.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.35.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.35.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.35.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.35.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.35.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.35.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.36.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.36.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.36.gate_proj.weight": "model-00036-of-00092.safetensors", + 
"model.layers.35.mlp.experts.36.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.36.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.36.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.37.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.37.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.37.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.37.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.37.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.37.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.38.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.38.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.38.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.38.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.38.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.38.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.39.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.39.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.39.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.39.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.39.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.39.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.4.down_proj.weight": 
"model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.4.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.4.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.4.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.4.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.4.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.40.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.40.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.40.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.40.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.40.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.40.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.41.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.41.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.41.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.41.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.41.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.41.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.42.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.42.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.42.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.42.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + 
"model.layers.35.mlp.experts.42.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.42.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.43.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.43.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.43.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.43.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.43.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.43.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.44.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.44.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.44.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.44.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.44.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.44.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.45.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.45.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.45.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.45.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.45.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.45.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.46.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.46.down_proj.weight_scale": 
"model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.46.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.46.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.46.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.46.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.47.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.47.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.47.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.47.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.47.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.47.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.48.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.48.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.48.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.48.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.48.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.48.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.49.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.49.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.49.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.49.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.49.up_proj.weight": "model-00036-of-00092.safetensors", + 
"model.layers.35.mlp.experts.49.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.5.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.5.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.5.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.5.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.5.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.5.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.50.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.50.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.50.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.50.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.50.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.50.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.51.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.51.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.51.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.51.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.51.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.51.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.52.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.52.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.52.gate_proj.weight": 
"model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.52.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.52.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.52.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.53.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.53.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.53.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.53.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.53.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.53.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.54.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.54.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.54.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.54.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.54.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.54.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.55.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.55.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.55.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.55.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.55.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.55.up_proj.weight_scale": "model-00036-of-00092.safetensors", + 
"model.layers.35.mlp.experts.56.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.56.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.56.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.56.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.56.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.56.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.57.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.57.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.57.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.57.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.57.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.57.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.58.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.58.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.58.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.58.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.58.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.58.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.59.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.59.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.59.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.59.gate_proj.weight_scale": 
"model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.59.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.59.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.6.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.6.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.6.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.6.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.6.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.6.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.60.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.60.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.60.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.60.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.60.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.60.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.61.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.61.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.61.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.61.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.61.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.61.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.62.down_proj.weight": "model-00036-of-00092.safetensors", + 
"model.layers.35.mlp.experts.62.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.62.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.62.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.62.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.62.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.63.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.63.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.63.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.63.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.63.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.63.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.64.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.64.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.64.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.64.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.64.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.64.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.65.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.65.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.65.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.65.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.65.up_proj.weight": 
"model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.65.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.66.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.66.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.66.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.66.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.66.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.66.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.67.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.67.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.67.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.67.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.67.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.67.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.68.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.68.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.68.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.68.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.68.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.68.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.69.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.69.down_proj.weight_scale": "model-00036-of-00092.safetensors", + 
"model.layers.35.mlp.experts.69.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.69.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.69.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.69.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.7.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.7.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.7.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.7.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.7.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.7.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.70.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.70.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.70.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.70.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.70.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.70.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.71.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.71.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.71.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.71.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.71.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.71.up_proj.weight_scale": "model-00036-of-00092.safetensors", 
+ "model.layers.35.mlp.experts.72.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.72.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.72.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.72.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.72.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.72.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.73.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.73.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.73.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.73.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.73.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.73.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.74.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.74.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.74.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.74.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.74.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.74.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.75.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.75.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.75.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.75.gate_proj.weight_scale": 
"model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.75.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.75.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.76.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.76.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.76.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.76.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.76.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.76.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.77.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.77.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.77.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.77.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.77.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.77.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.78.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.78.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.78.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.78.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.78.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.78.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.79.down_proj.weight": "model-00036-of-00092.safetensors", + 
"model.layers.35.mlp.experts.79.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.79.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.79.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.79.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.79.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.8.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.8.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.8.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.8.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.8.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.8.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.80.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.80.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.80.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.80.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.80.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.80.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.81.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.81.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.81.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.81.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.81.up_proj.weight": 
"model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.81.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.82.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.82.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.82.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.82.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.82.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.82.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.83.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.83.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.83.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.83.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.83.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.83.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.84.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.84.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.84.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.84.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.84.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.84.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.85.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.85.down_proj.weight_scale": "model-00036-of-00092.safetensors", + 
"model.layers.35.mlp.experts.85.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.85.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.85.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.85.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.86.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.86.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.86.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.86.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.86.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.86.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.87.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.87.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.87.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.87.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.87.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.87.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.88.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.88.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.88.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.88.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.88.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.88.up_proj.weight_scale": 
"model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.89.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.89.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.89.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.89.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.89.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.89.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.9.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.9.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.9.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.9.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.9.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.9.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.90.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.90.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.90.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.90.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.90.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.90.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.91.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.91.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.91.gate_proj.weight": "model-00036-of-00092.safetensors", + 
"model.layers.35.mlp.experts.91.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.91.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.91.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.92.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.92.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.92.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.92.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.92.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.92.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.93.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.93.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.93.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.93.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.93.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.93.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.94.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.94.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.94.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.94.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.94.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.94.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.95.down_proj.weight": 
"model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.95.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.95.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.95.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.95.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.95.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.96.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.96.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.96.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.96.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.96.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.96.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.97.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.97.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.97.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.97.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.97.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.97.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.98.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.98.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.98.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.98.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + 
"model.layers.35.mlp.experts.98.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.98.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.99.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.99.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.99.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.99.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.99.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.experts.99.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.gate.e_score_correction_bias": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.gate.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.shared_experts.down_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.shared_experts.down_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.shared_experts.gate_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.shared_experts.gate_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.shared_experts.up_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.mlp.shared_experts.up_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.post_attention_layernorm.weight": "model-00036-of-00092.safetensors", + "model.layers.35.self_attn.k_norm.weight": "model-00036-of-00092.safetensors", + "model.layers.35.self_attn.k_proj.bias": "model-00036-of-00092.safetensors", + "model.layers.35.self_attn.k_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.self_attn.k_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.self_attn.o_proj.weight": "model-00036-of-00092.safetensors", + 
"model.layers.35.self_attn.o_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.self_attn.q_norm.weight": "model-00036-of-00092.safetensors", + "model.layers.35.self_attn.q_proj.bias": "model-00036-of-00092.safetensors", + "model.layers.35.self_attn.q_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.self_attn.q_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.35.self_attn.v_proj.bias": "model-00036-of-00092.safetensors", + "model.layers.35.self_attn.v_proj.weight": "model-00036-of-00092.safetensors", + "model.layers.35.self_attn.v_proj.weight_scale": "model-00036-of-00092.safetensors", + "model.layers.36.input_layernorm.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.0.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.0.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.0.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.0.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.0.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.0.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.1.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.1.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.1.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.1.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.1.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.1.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.10.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.10.down_proj.weight_scale": 
"model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.10.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.10.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.10.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.10.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.100.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.100.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.100.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.100.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.100.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.100.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.101.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.101.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.101.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.101.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.101.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.101.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.102.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.102.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.102.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.102.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.102.up_proj.weight": "model-00037-of-00092.safetensors", + 
"model.layers.36.mlp.experts.102.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.103.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.103.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.103.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.103.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.103.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.103.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.104.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.104.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.104.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.104.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.104.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.104.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.105.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.105.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.105.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.105.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.105.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.105.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.106.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.106.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.106.gate_proj.weight": 
"model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.106.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.106.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.106.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.107.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.107.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.107.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.107.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.107.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.107.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.108.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.108.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.108.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.108.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.108.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.108.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.109.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.109.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.109.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.109.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.109.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.109.up_proj.weight_scale": "model-00037-of-00092.safetensors", + 
"model.layers.36.mlp.experts.11.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.11.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.11.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.11.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.11.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.11.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.110.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.110.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.110.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.110.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.110.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.110.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.111.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.111.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.111.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.111.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.111.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.111.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.112.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.112.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.112.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.112.gate_proj.weight_scale": 
"model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.112.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.112.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.113.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.113.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.113.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.113.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.113.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.113.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.114.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.114.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.114.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.114.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.114.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.114.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.115.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.115.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.115.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.115.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.115.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.115.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.116.down_proj.weight": "model-00037-of-00092.safetensors", + 
"model.layers.36.mlp.experts.116.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.116.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.116.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.116.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.116.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.117.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.117.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.117.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.117.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.117.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.117.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.118.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.118.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.118.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.118.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.118.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.118.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.119.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.119.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.119.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.119.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.119.up_proj.weight": 
"model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.119.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.12.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.12.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.12.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.12.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.12.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.12.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.120.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.120.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.120.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.120.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.120.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.120.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.121.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.121.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.121.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.121.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.121.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.121.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.122.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.122.down_proj.weight_scale": "model-00037-of-00092.safetensors", + 
"model.layers.36.mlp.experts.122.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.122.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.122.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.122.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.123.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.123.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.123.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.123.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.123.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.123.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.124.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.124.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.124.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.124.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.124.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.124.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.125.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.125.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.125.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.125.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.125.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.125.up_proj.weight_scale": 
"model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.126.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.126.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.126.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.126.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.126.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.126.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.127.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.127.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.127.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.127.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.127.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.127.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.128.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.128.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.128.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.128.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.128.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.128.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.129.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.129.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.129.gate_proj.weight": "model-00037-of-00092.safetensors", + 
"model.layers.36.mlp.experts.129.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.129.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.129.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.13.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.13.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.13.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.13.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.13.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.13.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.130.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.130.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.130.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.130.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.130.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.130.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.131.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.131.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.131.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.131.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.131.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.131.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.132.down_proj.weight": 
"model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.132.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.132.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.132.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.132.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.132.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.133.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.133.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.133.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.133.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.133.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.133.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.134.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.134.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.134.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.134.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.134.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.134.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.135.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.135.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.135.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.135.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + 
"model.layers.36.mlp.experts.135.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.135.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.136.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.136.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.136.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.136.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.136.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.136.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.137.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.137.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.137.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.137.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.137.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.137.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.138.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.138.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.138.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.138.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.138.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.138.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.139.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.139.down_proj.weight_scale": 
"model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.139.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.139.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.139.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.139.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.14.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.14.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.14.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.14.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.14.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.14.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.140.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.140.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.140.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.140.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.140.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.140.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.141.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.141.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.141.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.141.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.141.up_proj.weight": "model-00037-of-00092.safetensors", + 
"model.layers.36.mlp.experts.141.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.142.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.142.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.142.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.142.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.142.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.142.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.143.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.143.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.143.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.143.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.143.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.143.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.144.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.144.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.144.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.144.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.144.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.144.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.145.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.145.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.145.gate_proj.weight": 
"model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.145.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.145.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.145.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.146.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.146.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.146.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.146.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.146.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.146.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.147.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.147.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.147.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.147.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.147.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.147.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.148.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.148.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.148.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.148.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.148.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.148.up_proj.weight_scale": "model-00037-of-00092.safetensors", + 
"model.layers.36.mlp.experts.149.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.149.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.149.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.149.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.149.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.149.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.15.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.15.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.15.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.15.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.15.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.15.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.150.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.150.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.150.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.150.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.150.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.150.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.151.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.151.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.151.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.151.gate_proj.weight_scale": 
"model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.151.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.151.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.152.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.152.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.152.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.152.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.152.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.152.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.153.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.153.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.153.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.153.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.153.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.153.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.154.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.154.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.154.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.154.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.154.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.154.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.155.down_proj.weight": "model-00037-of-00092.safetensors", + 
"model.layers.36.mlp.experts.155.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.155.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.155.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.155.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.155.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.156.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.156.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.156.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.156.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.156.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.156.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.157.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.157.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.157.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.157.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.157.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.157.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.158.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.158.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.158.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.158.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.158.up_proj.weight": 
"model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.158.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.159.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.159.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.159.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.159.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.159.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.159.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.16.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.16.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.16.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.16.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.16.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.16.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.17.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.17.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.17.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.17.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.17.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.17.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.18.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.18.down_proj.weight_scale": "model-00037-of-00092.safetensors", + 
"model.layers.36.mlp.experts.18.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.18.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.18.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.18.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.19.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.19.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.19.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.19.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.19.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.19.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.2.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.2.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.2.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.2.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.2.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.2.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.20.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.20.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.20.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.20.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.20.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.20.up_proj.weight_scale": "model-00037-of-00092.safetensors", 
+ "model.layers.36.mlp.experts.21.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.21.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.21.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.21.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.21.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.21.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.22.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.22.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.22.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.22.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.22.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.22.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.23.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.23.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.23.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.23.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.23.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.23.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.24.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.24.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.24.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.24.gate_proj.weight_scale": 
"model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.24.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.24.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.25.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.25.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.25.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.25.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.25.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.25.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.26.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.26.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.26.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.26.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.26.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.26.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.27.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.27.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.27.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.27.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.27.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.27.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.28.down_proj.weight": "model-00037-of-00092.safetensors", + 
"model.layers.36.mlp.experts.28.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.28.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.28.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.28.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.28.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.29.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.29.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.29.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.29.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.29.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.29.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.3.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.3.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.3.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.3.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.3.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.3.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.30.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.30.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.30.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.30.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.30.up_proj.weight": 
"model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.30.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.31.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.31.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.31.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.31.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.31.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.31.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.32.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.32.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.32.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.32.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.32.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.32.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.33.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.33.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.33.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.33.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.33.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.33.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.34.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.34.down_proj.weight_scale": "model-00037-of-00092.safetensors", + 
"model.layers.36.mlp.experts.34.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.34.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.34.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.34.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.35.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.35.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.35.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.35.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.35.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.35.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.36.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.36.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.36.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.36.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.36.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.36.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.37.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.37.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.37.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.37.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.37.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.37.up_proj.weight_scale": 
"model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.38.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.38.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.38.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.38.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.38.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.38.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.39.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.39.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.39.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.39.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.39.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.39.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.4.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.4.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.4.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.4.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.4.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.4.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.40.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.40.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.40.gate_proj.weight": "model-00037-of-00092.safetensors", + 
"model.layers.36.mlp.experts.40.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.40.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.40.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.41.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.41.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.41.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.41.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.41.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.41.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.42.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.42.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.42.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.42.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.42.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.42.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.43.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.43.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.43.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.43.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.43.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.43.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.44.down_proj.weight": 
"model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.44.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.44.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.44.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.44.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.44.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.45.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.45.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.45.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.45.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.45.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.45.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.46.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.46.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.46.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.46.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.46.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.46.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.47.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.47.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.47.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.47.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + 
"model.layers.36.mlp.experts.47.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.47.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.48.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.48.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.48.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.48.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.48.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.48.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.49.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.49.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.49.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.49.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.49.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.49.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.5.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.5.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.5.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.5.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.5.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.5.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.50.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.50.down_proj.weight_scale": "model-00037-of-00092.safetensors", 
+ "model.layers.36.mlp.experts.50.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.50.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.50.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.50.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.51.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.51.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.51.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.51.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.51.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.51.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.52.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.52.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.52.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.52.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.52.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.52.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.53.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.53.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.53.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.53.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.53.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.53.up_proj.weight_scale": 
"model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.54.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.54.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.54.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.54.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.54.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.54.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.55.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.55.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.55.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.55.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.55.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.55.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.56.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.56.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.56.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.56.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.56.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.56.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.57.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.57.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.57.gate_proj.weight": "model-00037-of-00092.safetensors", + 
"model.layers.36.mlp.experts.57.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.57.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.57.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.58.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.58.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.58.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.58.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.58.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.58.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.59.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.59.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.59.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.59.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.59.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.59.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.6.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.6.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.6.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.6.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.6.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.6.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.60.down_proj.weight": "model-00037-of-00092.safetensors", 
+ "model.layers.36.mlp.experts.60.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.60.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.60.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.60.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.60.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.61.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.61.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.61.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.61.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.61.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.61.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.62.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.62.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.62.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.62.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.62.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.62.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.63.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.63.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.63.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.63.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.63.up_proj.weight": 
"model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.63.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.64.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.64.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.64.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.64.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.64.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.64.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.65.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.65.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.65.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.65.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.65.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.65.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.66.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.66.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.66.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.66.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.66.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.66.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.67.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.67.down_proj.weight_scale": "model-00037-of-00092.safetensors", + 
"model.layers.36.mlp.experts.67.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.67.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.67.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.67.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.68.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.68.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.68.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.68.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.68.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.68.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.69.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.69.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.69.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.69.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.69.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.69.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.7.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.7.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.7.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.7.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.7.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.7.up_proj.weight_scale": "model-00037-of-00092.safetensors", 
+ "model.layers.36.mlp.experts.70.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.70.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.70.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.70.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.70.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.70.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.71.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.71.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.71.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.71.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.71.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.71.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.72.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.72.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.72.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.72.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.72.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.72.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.73.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.73.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.73.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.73.gate_proj.weight_scale": 
"model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.73.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.73.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.74.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.74.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.74.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.74.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.74.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.74.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.75.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.75.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.75.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.75.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.75.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.75.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.76.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.76.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.76.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.76.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.76.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.76.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.77.down_proj.weight": "model-00037-of-00092.safetensors", + 
"model.layers.36.mlp.experts.77.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.77.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.77.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.77.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.77.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.78.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.78.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.78.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.78.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.78.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.78.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.79.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.79.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.79.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.79.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.79.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.79.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.8.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.8.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.8.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.8.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.8.up_proj.weight": 
"model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.8.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.80.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.80.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.80.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.80.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.80.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.80.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.81.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.81.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.81.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.81.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.81.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.81.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.82.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.82.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.82.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.82.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.82.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.82.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.83.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.83.down_proj.weight_scale": "model-00037-of-00092.safetensors", + 
"model.layers.36.mlp.experts.83.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.83.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.83.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.83.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.84.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.84.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.84.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.84.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.84.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.84.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.85.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.85.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.85.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.85.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.85.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.85.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.86.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.86.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.86.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.86.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.86.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.86.up_proj.weight_scale": 
"model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.87.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.87.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.87.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.87.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.87.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.87.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.88.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.88.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.88.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.88.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.88.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.88.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.89.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.89.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.89.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.89.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.89.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.89.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.9.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.9.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.9.gate_proj.weight": "model-00037-of-00092.safetensors", + 
"model.layers.36.mlp.experts.9.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.9.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.9.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.90.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.90.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.90.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.90.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.90.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.90.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.91.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.91.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.91.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.91.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.91.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.91.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.92.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.92.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.92.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.92.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.92.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.92.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.93.down_proj.weight": 
"model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.93.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.93.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.93.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.93.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.93.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.94.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.94.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.94.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.94.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.94.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.94.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.95.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.95.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.95.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.95.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.95.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.95.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.96.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.96.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.96.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.96.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + 
"model.layers.36.mlp.experts.96.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.96.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.97.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.97.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.97.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.97.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.97.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.97.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.98.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.98.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.98.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.98.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.98.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.98.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.99.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.99.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.99.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.99.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.99.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.experts.99.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.gate.e_score_correction_bias": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.gate.weight": "model-00037-of-00092.safetensors", + 
"model.layers.36.mlp.shared_experts.down_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.shared_experts.down_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.shared_experts.gate_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.shared_experts.gate_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.shared_experts.up_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.mlp.shared_experts.up_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.post_attention_layernorm.weight": "model-00037-of-00092.safetensors", + "model.layers.36.self_attn.k_norm.weight": "model-00037-of-00092.safetensors", + "model.layers.36.self_attn.k_proj.bias": "model-00037-of-00092.safetensors", + "model.layers.36.self_attn.k_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.self_attn.k_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.self_attn.o_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.self_attn.o_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.self_attn.q_norm.weight": "model-00037-of-00092.safetensors", + "model.layers.36.self_attn.q_proj.bias": "model-00037-of-00092.safetensors", + "model.layers.36.self_attn.q_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.self_attn.q_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.36.self_attn.v_proj.bias": "model-00037-of-00092.safetensors", + "model.layers.36.self_attn.v_proj.weight": "model-00037-of-00092.safetensors", + "model.layers.36.self_attn.v_proj.weight_scale": "model-00037-of-00092.safetensors", + "model.layers.37.input_layernorm.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.0.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.0.down_proj.weight_scale": "model-00038-of-00092.safetensors", + 
"model.layers.37.mlp.experts.0.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.0.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.0.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.0.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.1.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.1.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.1.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.1.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.1.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.1.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.10.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.10.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.10.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.10.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.10.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.10.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.100.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.100.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.100.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.100.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.100.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.100.up_proj.weight_scale": 
"model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.101.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.101.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.101.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.101.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.101.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.101.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.102.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.102.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.102.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.102.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.102.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.102.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.103.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.103.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.103.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.103.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.103.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.103.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.104.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.104.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.104.gate_proj.weight": "model-00038-of-00092.safetensors", + 
"model.layers.37.mlp.experts.104.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.104.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.104.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.105.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.105.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.105.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.105.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.105.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.105.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.106.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.106.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.106.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.106.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.106.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.106.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.107.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.107.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.107.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.107.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.107.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.107.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.108.down_proj.weight": 
"model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.108.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.108.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.108.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.108.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.108.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.109.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.109.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.109.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.109.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.109.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.109.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.11.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.11.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.11.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.11.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.11.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.11.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.110.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.110.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.110.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.110.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + 
"model.layers.37.mlp.experts.110.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.110.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.111.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.111.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.111.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.111.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.111.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.111.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.112.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.112.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.112.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.112.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.112.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.112.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.113.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.113.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.113.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.113.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.113.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.113.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.114.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.114.down_proj.weight_scale": 
"model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.114.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.114.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.114.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.114.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.115.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.115.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.115.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.115.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.115.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.115.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.116.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.116.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.116.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.116.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.116.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.116.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.117.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.117.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.117.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.117.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.117.up_proj.weight": "model-00038-of-00092.safetensors", + 
"model.layers.37.mlp.experts.117.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.118.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.118.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.118.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.118.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.118.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.118.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.119.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.119.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.119.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.119.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.119.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.119.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.12.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.12.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.12.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.12.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.12.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.12.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.120.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.120.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.120.gate_proj.weight": 
"model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.120.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.120.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.120.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.121.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.121.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.121.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.121.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.121.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.121.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.122.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.122.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.122.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.122.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.122.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.122.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.123.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.123.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.123.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.123.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.123.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.123.up_proj.weight_scale": "model-00038-of-00092.safetensors", + 
"model.layers.37.mlp.experts.124.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.124.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.124.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.124.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.124.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.124.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.125.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.125.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.125.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.125.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.125.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.125.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.126.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.126.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.126.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.126.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.126.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.126.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.127.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.127.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.127.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.127.gate_proj.weight_scale": 
"model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.127.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.127.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.128.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.128.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.128.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.128.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.128.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.128.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.129.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.129.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.129.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.129.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.129.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.129.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.13.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.13.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.13.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.13.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.13.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.13.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.130.down_proj.weight": "model-00038-of-00092.safetensors", + 
"model.layers.37.mlp.experts.130.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.130.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.130.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.130.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.130.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.131.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.131.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.131.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.131.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.131.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.131.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.132.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.132.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.132.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.132.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.132.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.132.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.133.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.133.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.133.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.133.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.133.up_proj.weight": 
"model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.133.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.134.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.134.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.134.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.134.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.134.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.134.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.135.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.135.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.135.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.135.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.135.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.135.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.136.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.136.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.136.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.136.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.136.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.136.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.137.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.137.down_proj.weight_scale": "model-00038-of-00092.safetensors", + 
"model.layers.37.mlp.experts.137.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.137.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.137.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.137.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.138.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.138.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.138.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.138.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.138.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.138.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.139.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.139.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.139.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.139.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.139.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.139.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.14.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.14.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.14.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.14.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.14.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.14.up_proj.weight_scale": 
"model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.140.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.140.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.140.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.140.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.140.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.140.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.141.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.141.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.141.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.141.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.141.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.141.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.142.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.142.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.142.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.142.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.142.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.142.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.143.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.143.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.143.gate_proj.weight": "model-00038-of-00092.safetensors", + 
"model.layers.37.mlp.experts.143.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.143.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.143.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.144.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.144.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.144.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.144.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.144.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.144.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.145.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.145.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.145.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.145.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.145.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.145.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.146.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.146.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.146.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.146.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.146.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.146.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.147.down_proj.weight": 
"model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.147.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.147.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.147.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.147.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.147.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.148.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.148.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.148.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.148.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.148.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.148.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.149.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.149.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.149.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.149.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.149.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.149.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.15.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.15.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.15.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.15.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + 
"model.layers.37.mlp.experts.15.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.15.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.150.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.150.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.150.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.150.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.150.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.150.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.151.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.151.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.151.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.151.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.151.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.151.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.152.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.152.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.152.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.152.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.152.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.152.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.153.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.153.down_proj.weight_scale": 
"model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.153.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.153.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.153.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.153.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.154.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.154.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.154.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.154.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.154.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.154.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.155.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.155.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.155.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.155.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.155.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.155.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.156.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.156.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.156.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.156.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.156.up_proj.weight": "model-00038-of-00092.safetensors", + 
"model.layers.37.mlp.experts.156.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.157.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.157.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.157.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.157.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.157.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.157.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.158.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.158.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.158.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.158.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.158.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.158.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.159.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.159.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.159.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.159.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.159.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.159.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.16.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.16.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.16.gate_proj.weight": 
"model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.16.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.16.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.16.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.17.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.17.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.17.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.17.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.17.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.17.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.18.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.18.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.18.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.18.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.18.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.18.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.19.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.19.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.19.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.19.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.19.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.19.up_proj.weight_scale": "model-00038-of-00092.safetensors", + 
"model.layers.37.mlp.experts.2.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.2.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.2.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.2.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.2.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.2.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.20.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.20.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.20.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.20.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.20.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.20.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.21.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.21.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.21.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.21.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.21.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.21.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.22.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.22.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.22.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.22.gate_proj.weight_scale": 
"model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.22.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.22.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.23.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.23.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.23.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.23.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.23.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.23.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.24.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.24.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.24.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.24.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.24.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.24.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.25.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.25.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.25.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.25.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.25.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.25.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.26.down_proj.weight": "model-00038-of-00092.safetensors", + 
"model.layers.37.mlp.experts.26.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.26.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.26.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.26.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.26.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.27.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.27.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.27.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.27.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.27.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.27.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.28.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.28.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.28.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.28.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.28.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.28.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.29.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.29.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.29.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.29.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.29.up_proj.weight": 
"model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.29.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.3.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.3.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.3.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.3.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.3.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.3.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.30.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.30.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.30.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.30.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.30.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.30.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.31.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.31.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.31.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.31.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.31.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.31.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.32.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.32.down_proj.weight_scale": "model-00038-of-00092.safetensors", + 
"model.layers.37.mlp.experts.32.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.32.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.32.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.32.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.33.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.33.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.33.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.33.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.33.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.33.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.34.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.34.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.34.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.34.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.34.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.34.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.35.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.35.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.35.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.35.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.35.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.35.up_proj.weight_scale": 
"model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.36.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.36.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.36.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.36.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.36.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.36.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.37.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.37.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.37.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.37.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.37.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.37.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.38.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.38.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.38.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.38.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.38.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.38.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.39.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.39.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.39.gate_proj.weight": "model-00038-of-00092.safetensors", + 
"model.layers.37.mlp.experts.39.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.39.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.39.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.4.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.4.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.4.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.4.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.4.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.4.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.40.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.40.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.40.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.40.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.40.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.40.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.41.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.41.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.41.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.41.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.41.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.41.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.42.down_proj.weight": "model-00038-of-00092.safetensors", 
+ "model.layers.37.mlp.experts.42.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.42.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.42.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.42.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.42.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.43.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.43.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.43.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.43.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.43.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.43.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.44.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.44.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.44.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.44.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.44.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.44.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.45.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.45.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.45.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.45.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.45.up_proj.weight": 
"model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.45.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.46.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.46.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.46.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.46.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.46.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.46.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.47.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.47.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.47.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.47.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.47.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.47.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.48.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.48.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.48.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.48.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.48.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.48.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.49.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.49.down_proj.weight_scale": "model-00038-of-00092.safetensors", + 
"model.layers.37.mlp.experts.49.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.49.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.49.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.49.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.5.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.5.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.5.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.5.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.5.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.5.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.50.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.50.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.50.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.50.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.50.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.50.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.51.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.51.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.51.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.51.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.51.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.51.up_proj.weight_scale": "model-00038-of-00092.safetensors", 
+ "model.layers.37.mlp.experts.52.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.52.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.52.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.52.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.52.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.52.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.53.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.53.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.53.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.53.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.53.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.53.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.54.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.54.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.54.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.54.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.54.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.54.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.55.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.55.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.55.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.55.gate_proj.weight_scale": 
"model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.55.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.55.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.56.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.56.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.56.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.56.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.56.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.56.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.57.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.57.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.57.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.57.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.57.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.57.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.58.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.58.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.58.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.58.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.58.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.58.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.59.down_proj.weight": "model-00038-of-00092.safetensors", + 
"model.layers.37.mlp.experts.59.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.59.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.59.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.59.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.59.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.6.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.6.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.6.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.6.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.6.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.6.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.60.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.60.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.60.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.60.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.60.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.60.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.61.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.61.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.61.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.61.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.61.up_proj.weight": 
"model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.61.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.62.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.62.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.62.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.62.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.62.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.62.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.63.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.63.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.63.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.63.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.63.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.63.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.64.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.64.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.64.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.64.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.64.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.64.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.65.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.65.down_proj.weight_scale": "model-00038-of-00092.safetensors", + 
"model.layers.37.mlp.experts.65.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.65.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.65.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.65.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.66.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.66.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.66.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.66.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.66.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.66.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.67.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.67.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.67.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.67.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.67.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.67.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.68.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.68.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.68.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.68.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.68.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.68.up_proj.weight_scale": 
"model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.69.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.69.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.69.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.69.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.69.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.69.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.7.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.7.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.7.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.7.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.7.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.7.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.70.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.70.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.70.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.70.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.70.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.70.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.71.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.71.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.71.gate_proj.weight": "model-00038-of-00092.safetensors", + 
"model.layers.37.mlp.experts.71.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.71.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.71.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.72.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.72.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.72.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.72.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.72.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.72.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.73.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.73.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.73.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.73.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.73.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.73.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.74.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.74.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.74.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.74.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.74.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.74.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.75.down_proj.weight": 
"model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.75.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.75.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.75.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.75.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.75.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.76.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.76.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.76.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.76.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.76.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.76.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.77.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.77.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.77.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.77.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.77.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.77.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.78.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.78.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.78.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.78.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + 
"model.layers.37.mlp.experts.78.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.78.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.79.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.79.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.79.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.79.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.79.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.79.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.8.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.8.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.8.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.8.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.8.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.8.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.80.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.80.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.80.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.80.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.80.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.80.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.81.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.81.down_proj.weight_scale": "model-00038-of-00092.safetensors", 
+ "model.layers.37.mlp.experts.81.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.81.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.81.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.81.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.82.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.82.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.82.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.82.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.82.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.82.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.83.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.83.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.83.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.83.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.83.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.83.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.84.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.84.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.84.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.84.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.84.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.84.up_proj.weight_scale": 
"model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.85.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.85.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.85.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.85.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.85.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.85.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.86.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.86.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.86.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.86.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.86.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.86.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.87.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.87.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.87.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.87.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.87.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.87.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.88.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.88.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.88.gate_proj.weight": "model-00038-of-00092.safetensors", + 
"model.layers.37.mlp.experts.88.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.88.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.88.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.89.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.89.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.89.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.89.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.89.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.89.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.9.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.9.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.9.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.9.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.9.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.9.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.90.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.90.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.90.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.90.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.90.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.90.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.91.down_proj.weight": "model-00038-of-00092.safetensors", 
+ "model.layers.37.mlp.experts.91.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.91.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.91.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.91.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.91.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.92.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.92.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.92.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.92.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.92.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.92.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.93.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.93.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.93.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.93.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.93.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.93.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.94.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.94.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.94.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.94.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.94.up_proj.weight": 
"model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.94.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.95.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.95.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.95.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.95.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.95.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.95.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.96.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.96.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.96.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.96.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.96.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.96.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.97.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.97.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.97.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.97.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.97.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.97.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.98.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.98.down_proj.weight_scale": "model-00038-of-00092.safetensors", + 
"model.layers.37.mlp.experts.98.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.98.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.98.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.98.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.99.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.99.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.99.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.99.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.99.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.experts.99.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.gate.e_score_correction_bias": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.gate.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.shared_experts.down_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.shared_experts.down_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.shared_experts.gate_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.shared_experts.gate_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.shared_experts.up_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.mlp.shared_experts.up_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.post_attention_layernorm.weight": "model-00038-of-00092.safetensors", + "model.layers.37.self_attn.k_norm.weight": "model-00038-of-00092.safetensors", + "model.layers.37.self_attn.k_proj.bias": "model-00038-of-00092.safetensors", + "model.layers.37.self_attn.k_proj.weight": "model-00038-of-00092.safetensors", + 
"model.layers.37.self_attn.k_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.self_attn.o_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.self_attn.o_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.self_attn.q_norm.weight": "model-00038-of-00092.safetensors", + "model.layers.37.self_attn.q_proj.bias": "model-00038-of-00092.safetensors", + "model.layers.37.self_attn.q_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.self_attn.q_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.37.self_attn.v_proj.bias": "model-00038-of-00092.safetensors", + "model.layers.37.self_attn.v_proj.weight": "model-00038-of-00092.safetensors", + "model.layers.37.self_attn.v_proj.weight_scale": "model-00038-of-00092.safetensors", + "model.layers.38.input_layernorm.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.0.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.0.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.0.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.0.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.0.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.0.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.1.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.1.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.1.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.1.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.1.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.1.up_proj.weight_scale": "model-00039-of-00092.safetensors", + 
"model.layers.38.mlp.experts.10.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.10.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.10.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.10.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.10.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.10.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.100.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.100.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.100.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.100.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.100.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.100.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.101.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.101.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.101.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.101.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.101.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.101.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.102.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.102.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.102.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.102.gate_proj.weight_scale": 
"model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.102.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.102.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.103.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.103.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.103.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.103.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.103.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.103.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.104.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.104.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.104.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.104.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.104.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.104.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.105.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.105.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.105.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.105.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.105.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.105.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.106.down_proj.weight": "model-00039-of-00092.safetensors", + 
"model.layers.38.mlp.experts.106.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.106.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.106.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.106.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.106.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.107.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.107.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.107.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.107.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.107.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.107.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.108.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.108.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.108.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.108.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.108.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.108.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.109.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.109.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.109.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.109.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.109.up_proj.weight": 
"model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.109.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.11.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.11.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.11.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.11.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.11.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.11.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.110.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.110.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.110.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.110.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.110.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.110.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.111.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.111.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.111.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.111.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.111.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.111.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.112.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.112.down_proj.weight_scale": "model-00039-of-00092.safetensors", + 
"model.layers.38.mlp.experts.112.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.112.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.112.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.112.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.113.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.113.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.113.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.113.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.113.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.113.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.114.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.114.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.114.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.114.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.114.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.114.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.115.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.115.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.115.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.115.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.115.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.115.up_proj.weight_scale": 
"model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.116.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.116.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.116.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.116.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.116.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.116.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.117.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.117.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.117.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.117.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.117.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.117.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.118.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.118.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.118.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.118.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.118.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.118.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.119.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.119.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.119.gate_proj.weight": "model-00039-of-00092.safetensors", + 
"model.layers.38.mlp.experts.119.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.119.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.119.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.12.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.12.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.12.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.12.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.12.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.12.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.120.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.120.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.120.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.120.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.120.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.120.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.121.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.121.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.121.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.121.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.121.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.121.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.122.down_proj.weight": 
"model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.122.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.122.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.122.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.122.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.122.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.123.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.123.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.123.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.123.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.123.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.123.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.124.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.124.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.124.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.124.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.124.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.124.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.125.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.125.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.125.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.125.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + 
"model.layers.38.mlp.experts.125.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.125.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.126.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.126.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.126.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.126.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.126.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.126.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.127.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.127.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.127.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.127.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.127.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.127.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.128.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.128.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.128.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.128.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.128.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.128.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.129.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.129.down_proj.weight_scale": 
"model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.129.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.129.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.129.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.129.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.13.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.13.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.13.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.13.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.13.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.13.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.130.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.130.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.130.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.130.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.130.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.130.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.131.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.131.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.131.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.131.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.131.up_proj.weight": "model-00039-of-00092.safetensors", + 
"model.layers.38.mlp.experts.131.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.132.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.132.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.132.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.132.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.132.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.132.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.133.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.133.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.133.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.133.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.133.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.133.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.134.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.134.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.134.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.134.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.134.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.134.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.135.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.135.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.135.gate_proj.weight": 
"model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.135.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.135.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.135.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.136.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.136.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.136.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.136.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.136.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.136.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.137.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.137.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.137.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.137.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.137.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.137.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.138.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.138.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.138.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.138.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.138.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.138.up_proj.weight_scale": "model-00039-of-00092.safetensors", + 
"model.layers.38.mlp.experts.139.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.139.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.139.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.139.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.139.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.139.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.14.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.14.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.14.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.14.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.14.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.14.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.140.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.140.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.140.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.140.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.140.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.140.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.141.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.141.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.141.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.141.gate_proj.weight_scale": 
"model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.141.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.141.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.142.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.142.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.142.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.142.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.142.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.142.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.143.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.143.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.143.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.143.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.143.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.143.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.144.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.144.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.144.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.144.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.144.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.144.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.145.down_proj.weight": "model-00039-of-00092.safetensors", + 
"model.layers.38.mlp.experts.145.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.145.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.145.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.145.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.145.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.146.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.146.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.146.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.146.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.146.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.146.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.147.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.147.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.147.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.147.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.147.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.147.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.148.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.148.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.148.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.148.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.148.up_proj.weight": 
"model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.148.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.149.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.149.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.149.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.149.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.149.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.149.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.15.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.15.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.15.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.15.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.15.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.15.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.150.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.150.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.150.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.150.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.150.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.150.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.151.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.151.down_proj.weight_scale": "model-00039-of-00092.safetensors", + 
"model.layers.38.mlp.experts.151.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.151.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.151.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.151.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.152.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.152.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.152.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.152.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.152.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.152.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.153.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.153.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.153.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.153.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.153.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.153.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.154.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.154.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.154.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.154.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.154.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.154.up_proj.weight_scale": 
"model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.155.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.155.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.155.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.155.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.155.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.155.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.156.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.156.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.156.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.156.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.156.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.156.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.157.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.157.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.157.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.157.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.157.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.157.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.158.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.158.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.158.gate_proj.weight": "model-00039-of-00092.safetensors", + 
"model.layers.38.mlp.experts.158.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.158.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.158.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.159.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.159.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.159.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.159.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.159.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.159.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.16.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.16.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.16.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.16.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.16.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.16.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.17.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.17.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.17.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.17.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.17.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.17.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.18.down_proj.weight": 
"model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.18.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.18.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.18.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.18.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.18.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.19.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.19.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.19.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.19.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.19.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.19.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.2.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.2.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.2.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.2.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.2.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.2.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.20.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.20.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.20.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.20.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + 
"model.layers.38.mlp.experts.20.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.20.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.21.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.21.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.21.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.21.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.21.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.21.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.22.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.22.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.22.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.22.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.22.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.22.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.23.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.23.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.23.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.23.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.23.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.23.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.24.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.24.down_proj.weight_scale": 
"model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.24.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.24.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.24.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.24.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.25.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.25.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.25.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.25.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.25.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.25.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.26.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.26.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.26.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.26.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.26.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.26.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.27.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.27.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.27.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.27.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.27.up_proj.weight": "model-00039-of-00092.safetensors", + 
"model.layers.38.mlp.experts.27.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.28.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.28.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.28.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.28.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.28.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.28.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.29.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.29.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.29.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.29.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.29.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.29.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.3.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.3.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.3.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.3.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.3.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.3.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.30.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.30.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.30.gate_proj.weight": 
"model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.30.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.30.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.30.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.31.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.31.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.31.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.31.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.31.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.31.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.32.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.32.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.32.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.32.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.32.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.32.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.33.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.33.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.33.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.33.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.33.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.33.up_proj.weight_scale": "model-00039-of-00092.safetensors", + 
"model.layers.38.mlp.experts.34.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.34.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.34.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.34.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.34.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.34.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.35.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.35.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.35.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.35.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.35.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.35.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.36.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.36.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.36.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.36.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.36.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.36.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.37.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.37.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.37.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.37.gate_proj.weight_scale": 
"model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.37.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.37.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.38.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.38.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.38.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.38.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.38.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.38.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.39.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.39.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.39.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.39.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.39.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.39.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.4.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.4.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.4.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.4.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.4.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.4.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.40.down_proj.weight": "model-00039-of-00092.safetensors", + 
"model.layers.38.mlp.experts.40.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.40.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.40.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.40.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.40.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.41.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.41.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.41.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.41.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.41.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.41.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.42.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.42.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.42.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.42.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.42.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.42.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.43.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.43.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.43.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.43.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.43.up_proj.weight": 
"model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.43.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.44.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.44.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.44.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.44.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.44.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.44.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.45.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.45.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.45.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.45.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.45.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.45.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.46.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.46.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.46.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.46.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.46.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.46.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.47.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.47.down_proj.weight_scale": "model-00039-of-00092.safetensors", + 
"model.layers.38.mlp.experts.47.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.47.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.47.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.47.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.48.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.48.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.48.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.48.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.48.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.48.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.49.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.49.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.49.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.49.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.49.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.49.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.5.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.5.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.5.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.5.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.5.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.5.up_proj.weight_scale": "model-00039-of-00092.safetensors", 
+ "model.layers.38.mlp.experts.50.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.50.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.50.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.50.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.50.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.50.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.51.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.51.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.51.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.51.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.51.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.51.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.52.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.52.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.52.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.52.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.52.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.52.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.53.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.53.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.53.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.53.gate_proj.weight_scale": 
"model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.53.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.53.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.54.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.54.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.54.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.54.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.54.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.54.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.55.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.55.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.55.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.55.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.55.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.55.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.56.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.56.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.56.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.56.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.56.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.56.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.57.down_proj.weight": "model-00039-of-00092.safetensors", + 
"model.layers.38.mlp.experts.57.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.57.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.57.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.57.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.57.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.58.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.58.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.58.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.58.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.58.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.58.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.59.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.59.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.59.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.59.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.59.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.59.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.6.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.6.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.6.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.6.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.6.up_proj.weight": 
"model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.6.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.60.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.60.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.60.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.60.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.60.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.60.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.61.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.61.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.61.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.61.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.61.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.61.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.62.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.62.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.62.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.62.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.62.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.62.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.63.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.63.down_proj.weight_scale": "model-00039-of-00092.safetensors", + 
"model.layers.38.mlp.experts.63.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.63.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.63.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.63.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.64.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.64.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.64.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.64.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.64.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.64.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.65.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.65.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.65.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.65.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.65.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.65.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.66.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.66.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.66.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.66.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.66.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.66.up_proj.weight_scale": 
"model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.67.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.67.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.67.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.67.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.67.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.67.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.68.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.68.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.68.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.68.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.68.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.68.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.69.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.69.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.69.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.69.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.69.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.69.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.7.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.7.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.7.gate_proj.weight": "model-00039-of-00092.safetensors", + 
"model.layers.38.mlp.experts.7.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.7.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.7.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.70.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.70.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.70.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.70.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.70.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.70.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.71.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.71.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.71.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.71.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.71.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.71.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.72.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.72.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.72.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.72.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.72.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.72.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.73.down_proj.weight": 
"model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.73.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.73.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.73.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.73.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.73.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.74.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.74.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.74.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.74.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.74.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.74.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.75.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.75.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.75.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.75.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.75.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.75.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.76.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.76.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.76.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.76.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + 
"model.layers.38.mlp.experts.76.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.76.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.77.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.77.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.77.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.77.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.77.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.77.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.78.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.78.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.78.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.78.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.78.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.78.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.79.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.79.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.79.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.79.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.79.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.79.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.8.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.8.down_proj.weight_scale": 
"model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.8.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.8.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.8.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.8.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.80.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.80.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.80.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.80.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.80.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.80.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.81.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.81.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.81.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.81.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.81.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.81.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.82.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.82.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.82.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.82.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.82.up_proj.weight": "model-00039-of-00092.safetensors", + 
"model.layers.38.mlp.experts.82.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.83.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.83.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.83.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.83.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.83.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.83.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.84.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.84.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.84.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.84.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.84.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.84.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.85.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.85.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.85.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.85.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.85.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.85.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.86.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.86.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.86.gate_proj.weight": 
"model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.86.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.86.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.86.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.87.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.87.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.87.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.87.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.87.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.87.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.88.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.88.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.88.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.88.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.88.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.88.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.89.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.89.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.89.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.89.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.89.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.89.up_proj.weight_scale": "model-00039-of-00092.safetensors", + 
"model.layers.38.mlp.experts.9.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.9.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.9.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.9.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.9.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.9.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.90.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.90.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.90.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.90.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.90.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.90.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.91.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.91.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.91.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.91.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.91.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.91.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.92.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.92.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.92.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.92.gate_proj.weight_scale": 
"model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.92.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.92.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.93.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.93.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.93.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.93.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.93.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.93.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.94.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.94.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.94.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.94.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.94.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.94.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.95.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.95.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.95.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.95.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.95.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.95.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.96.down_proj.weight": "model-00039-of-00092.safetensors", + 
"model.layers.38.mlp.experts.96.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.96.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.96.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.96.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.96.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.97.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.97.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.97.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.97.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.97.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.97.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.98.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.98.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.98.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.98.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.98.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.98.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.99.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.99.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.99.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.99.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.99.up_proj.weight": 
"model-00039-of-00092.safetensors", + "model.layers.38.mlp.experts.99.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.gate.e_score_correction_bias": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.gate.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.shared_experts.down_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.shared_experts.down_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.shared_experts.gate_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.shared_experts.gate_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.shared_experts.up_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.mlp.shared_experts.up_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.post_attention_layernorm.weight": "model-00039-of-00092.safetensors", + "model.layers.38.self_attn.k_norm.weight": "model-00039-of-00092.safetensors", + "model.layers.38.self_attn.k_proj.bias": "model-00039-of-00092.safetensors", + "model.layers.38.self_attn.k_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.self_attn.k_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.self_attn.o_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.self_attn.o_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.self_attn.q_norm.weight": "model-00039-of-00092.safetensors", + "model.layers.38.self_attn.q_proj.bias": "model-00039-of-00092.safetensors", + "model.layers.38.self_attn.q_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.self_attn.q_proj.weight_scale": "model-00039-of-00092.safetensors", + "model.layers.38.self_attn.v_proj.bias": "model-00039-of-00092.safetensors", + "model.layers.38.self_attn.v_proj.weight": "model-00039-of-00092.safetensors", + "model.layers.38.self_attn.v_proj.weight_scale": 
"model-00039-of-00092.safetensors", + "model.layers.39.input_layernorm.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.0.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.0.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.0.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.0.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.0.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.0.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.1.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.1.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.1.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.1.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.1.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.1.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.10.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.10.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.10.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.10.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.10.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.10.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.100.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.100.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.100.gate_proj.weight": 
"model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.100.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.100.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.100.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.101.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.101.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.101.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.101.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.101.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.101.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.102.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.102.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.102.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.102.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.102.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.102.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.103.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.103.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.103.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.103.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.103.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.103.up_proj.weight_scale": "model-00040-of-00092.safetensors", + 
"model.layers.39.mlp.experts.104.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.104.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.104.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.104.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.104.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.104.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.105.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.105.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.105.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.105.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.105.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.105.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.106.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.106.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.106.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.106.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.106.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.106.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.107.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.107.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.107.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.107.gate_proj.weight_scale": 
"model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.107.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.107.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.108.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.108.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.108.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.108.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.108.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.108.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.109.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.109.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.109.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.109.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.109.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.109.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.11.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.11.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.11.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.11.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.11.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.11.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.110.down_proj.weight": "model-00040-of-00092.safetensors", + 
"model.layers.39.mlp.experts.110.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.110.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.110.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.110.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.110.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.111.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.111.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.111.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.111.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.111.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.111.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.112.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.112.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.112.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.112.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.112.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.112.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.113.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.113.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.113.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.113.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.113.up_proj.weight": 
"model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.113.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.114.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.114.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.114.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.114.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.114.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.114.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.115.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.115.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.115.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.115.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.115.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.115.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.116.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.116.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.116.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.116.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.116.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.116.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.117.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.117.down_proj.weight_scale": "model-00040-of-00092.safetensors", + 
"model.layers.39.mlp.experts.117.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.117.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.117.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.117.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.118.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.118.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.118.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.118.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.118.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.118.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.119.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.119.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.119.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.119.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.119.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.119.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.12.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.12.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.12.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.12.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.12.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.12.up_proj.weight_scale": 
"model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.120.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.120.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.120.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.120.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.120.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.120.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.121.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.121.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.121.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.121.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.121.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.121.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.122.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.122.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.122.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.122.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.122.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.122.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.123.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.123.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.123.gate_proj.weight": "model-00040-of-00092.safetensors", + 
"model.layers.39.mlp.experts.123.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.123.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.123.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.124.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.124.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.124.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.124.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.124.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.124.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.125.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.125.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.125.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.125.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.125.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.125.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.126.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.126.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.126.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.126.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.126.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.126.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.127.down_proj.weight": 
"model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.127.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.127.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.127.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.127.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.127.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.128.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.128.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.128.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.128.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.128.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.128.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.129.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.129.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.129.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.129.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.129.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.129.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.13.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.13.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.13.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.13.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + 
"model.layers.39.mlp.experts.13.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.13.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.130.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.130.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.130.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.130.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.130.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.130.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.131.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.131.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.131.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.131.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.131.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.131.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.132.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.132.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.132.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.132.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.132.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.132.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.133.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.133.down_proj.weight_scale": 
"model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.133.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.133.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.133.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.133.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.134.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.134.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.134.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.134.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.134.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.134.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.135.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.135.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.135.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.135.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.135.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.135.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.136.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.136.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.136.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.136.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.136.up_proj.weight": "model-00040-of-00092.safetensors", + 
"model.layers.39.mlp.experts.136.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.137.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.137.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.137.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.137.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.137.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.137.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.138.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.138.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.138.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.138.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.138.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.138.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.139.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.139.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.139.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.139.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.139.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.139.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.14.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.14.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.14.gate_proj.weight": 
"model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.14.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.14.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.14.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.140.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.140.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.140.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.140.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.140.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.140.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.141.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.141.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.141.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.141.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.141.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.141.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.142.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.142.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.142.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.142.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.142.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.142.up_proj.weight_scale": "model-00040-of-00092.safetensors", + 
"model.layers.39.mlp.experts.143.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.143.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.143.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.143.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.143.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.143.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.144.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.144.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.144.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.144.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.144.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.144.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.145.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.145.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.145.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.145.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.145.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.145.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.146.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.146.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.146.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.146.gate_proj.weight_scale": 
"model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.146.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.146.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.147.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.147.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.147.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.147.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.147.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.147.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.148.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.148.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.148.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.148.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.148.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.148.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.149.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.149.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.149.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.149.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.149.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.149.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.15.down_proj.weight": "model-00040-of-00092.safetensors", + 
"model.layers.39.mlp.experts.15.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.15.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.15.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.15.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.15.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.150.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.150.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.150.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.150.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.150.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.150.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.151.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.151.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.151.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.151.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.151.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.151.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.152.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.152.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.152.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.152.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.152.up_proj.weight": 
"model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.152.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.153.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.153.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.153.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.153.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.153.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.153.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.154.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.154.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.154.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.154.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.154.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.154.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.155.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.155.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.155.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.155.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.155.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.155.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.156.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.156.down_proj.weight_scale": "model-00040-of-00092.safetensors", + 
"model.layers.39.mlp.experts.156.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.156.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.156.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.156.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.157.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.157.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.157.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.157.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.157.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.157.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.158.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.158.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.158.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.158.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.158.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.158.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.159.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.159.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.159.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.159.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.159.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.159.up_proj.weight_scale": 
"model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.16.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.16.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.16.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.16.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.16.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.16.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.17.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.17.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.17.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.17.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.17.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.17.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.18.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.18.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.18.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.18.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.18.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.18.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.19.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.19.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.19.gate_proj.weight": "model-00040-of-00092.safetensors", + 
"model.layers.39.mlp.experts.19.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.19.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.19.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.2.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.2.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.2.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.2.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.2.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.2.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.20.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.20.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.20.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.20.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.20.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.20.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.21.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.21.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.21.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.21.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.21.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.21.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.22.down_proj.weight": "model-00040-of-00092.safetensors", 
+ "model.layers.39.mlp.experts.22.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.22.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.22.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.22.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.22.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.23.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.23.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.23.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.23.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.23.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.23.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.24.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.24.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.24.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.24.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.24.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.24.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.25.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.25.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.25.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.25.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.25.up_proj.weight": 
"model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.25.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.26.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.26.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.26.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.26.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.26.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.26.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.27.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.27.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.27.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.27.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.27.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.27.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.28.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.28.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.28.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.28.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.28.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.28.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.29.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.29.down_proj.weight_scale": "model-00040-of-00092.safetensors", + 
"model.layers.39.mlp.experts.29.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.29.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.29.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.29.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.3.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.3.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.3.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.3.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.3.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.3.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.30.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.30.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.30.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.30.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.30.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.30.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.31.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.31.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.31.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.31.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.31.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.31.up_proj.weight_scale": "model-00040-of-00092.safetensors", 
+ "model.layers.39.mlp.experts.32.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.32.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.32.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.32.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.32.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.32.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.33.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.33.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.33.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.33.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.33.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.33.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.34.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.34.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.34.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.34.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.34.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.34.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.35.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.35.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.35.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.35.gate_proj.weight_scale": 
"model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.35.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.35.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.36.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.36.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.36.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.36.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.36.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.36.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.37.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.37.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.37.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.37.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.37.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.37.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.38.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.38.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.38.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.38.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.38.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.38.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.39.down_proj.weight": "model-00040-of-00092.safetensors", + 
"model.layers.39.mlp.experts.39.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.39.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.39.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.39.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.39.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.4.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.4.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.4.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.4.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.4.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.4.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.40.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.40.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.40.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.40.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.40.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.40.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.41.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.41.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.41.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.41.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.41.up_proj.weight": 
"model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.41.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.42.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.42.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.42.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.42.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.42.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.42.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.43.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.43.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.43.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.43.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.43.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.43.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.44.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.44.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.44.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.44.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.44.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.44.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.45.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.45.down_proj.weight_scale": "model-00040-of-00092.safetensors", + 
"model.layers.39.mlp.experts.45.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.45.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.45.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.45.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.46.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.46.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.46.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.46.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.46.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.46.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.47.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.47.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.47.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.47.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.47.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.47.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.48.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.48.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.48.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.48.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.48.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.48.up_proj.weight_scale": 
"model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.49.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.49.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.49.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.49.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.49.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.49.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.5.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.5.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.5.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.5.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.5.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.5.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.50.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.50.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.50.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.50.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.50.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.50.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.51.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.51.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.51.gate_proj.weight": "model-00040-of-00092.safetensors", + 
"model.layers.39.mlp.experts.51.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.51.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.51.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.52.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.52.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.52.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.52.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.52.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.52.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.53.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.53.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.53.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.53.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.53.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.53.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.54.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.54.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.54.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.54.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.54.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.54.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.55.down_proj.weight": 
"model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.55.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.55.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.55.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.55.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.55.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.56.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.56.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.56.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.56.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.56.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.56.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.57.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.57.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.57.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.57.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.57.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.57.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.58.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.58.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.58.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.58.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + 
"model.layers.39.mlp.experts.58.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.58.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.59.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.59.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.59.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.59.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.59.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.59.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.6.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.6.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.6.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.6.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.6.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.6.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.60.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.60.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.60.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.60.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.60.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.60.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.61.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.61.down_proj.weight_scale": "model-00040-of-00092.safetensors", 
+ "model.layers.39.mlp.experts.61.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.61.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.61.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.61.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.62.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.62.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.62.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.62.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.62.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.62.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.63.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.63.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.63.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.63.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.63.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.63.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.64.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.64.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.64.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.64.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.64.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.64.up_proj.weight_scale": 
"model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.65.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.65.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.65.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.65.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.65.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.65.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.66.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.66.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.66.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.66.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.66.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.66.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.67.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.67.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.67.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.67.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.67.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.67.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.68.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.68.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.68.gate_proj.weight": "model-00040-of-00092.safetensors", + 
"model.layers.39.mlp.experts.68.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.68.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.68.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.69.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.69.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.69.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.69.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.69.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.69.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.7.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.7.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.7.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.7.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.7.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.7.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.70.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.70.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.70.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.70.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.70.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.70.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.71.down_proj.weight": "model-00040-of-00092.safetensors", 
+ "model.layers.39.mlp.experts.71.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.71.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.71.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.71.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.71.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.72.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.72.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.72.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.72.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.72.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.72.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.73.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.73.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.73.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.73.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.73.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.73.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.74.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.74.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.74.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.74.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.74.up_proj.weight": 
"model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.74.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.75.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.75.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.75.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.75.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.75.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.75.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.76.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.76.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.76.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.76.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.76.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.76.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.77.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.77.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.77.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.77.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.77.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.77.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.78.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.78.down_proj.weight_scale": "model-00040-of-00092.safetensors", + 
"model.layers.39.mlp.experts.78.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.78.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.78.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.78.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.79.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.79.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.79.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.79.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.79.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.79.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.8.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.8.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.8.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.8.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.8.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.8.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.80.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.80.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.80.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.80.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.80.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.80.up_proj.weight_scale": "model-00040-of-00092.safetensors", 
+ "model.layers.39.mlp.experts.81.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.81.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.81.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.81.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.81.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.81.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.82.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.82.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.82.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.82.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.82.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.82.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.83.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.83.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.83.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.83.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.83.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.83.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.84.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.84.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.84.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.84.gate_proj.weight_scale": 
"model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.84.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.84.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.85.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.85.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.85.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.85.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.85.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.85.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.86.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.86.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.86.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.86.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.86.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.86.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.87.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.87.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.87.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.87.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.87.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.87.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.88.down_proj.weight": "model-00040-of-00092.safetensors", + 
"model.layers.39.mlp.experts.88.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.88.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.88.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.88.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.88.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.89.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.89.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.89.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.89.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.89.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.89.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.9.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.9.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.9.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.9.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.9.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.9.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.90.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.90.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.90.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.90.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.90.up_proj.weight": 
"model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.90.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.91.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.91.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.91.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.91.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.91.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.91.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.92.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.92.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.92.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.92.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.92.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.92.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.93.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.93.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.93.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.93.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.93.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.93.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.94.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.94.down_proj.weight_scale": "model-00040-of-00092.safetensors", + 
"model.layers.39.mlp.experts.94.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.94.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.94.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.94.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.95.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.95.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.95.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.95.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.95.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.95.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.96.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.96.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.96.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.96.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.96.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.96.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.97.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.97.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.97.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.97.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.97.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.97.up_proj.weight_scale": 
"model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.98.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.98.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.98.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.98.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.98.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.98.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.99.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.99.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.99.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.99.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.99.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.experts.99.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.gate.e_score_correction_bias": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.gate.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.shared_experts.down_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.shared_experts.down_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.shared_experts.gate_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.shared_experts.gate_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.shared_experts.up_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.mlp.shared_experts.up_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.post_attention_layernorm.weight": "model-00040-of-00092.safetensors", + 
"model.layers.39.self_attn.k_norm.weight": "model-00040-of-00092.safetensors", + "model.layers.39.self_attn.k_proj.bias": "model-00040-of-00092.safetensors", + "model.layers.39.self_attn.k_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.self_attn.k_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.self_attn.o_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.self_attn.o_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.self_attn.q_norm.weight": "model-00040-of-00092.safetensors", + "model.layers.39.self_attn.q_proj.bias": "model-00040-of-00092.safetensors", + "model.layers.39.self_attn.q_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.self_attn.q_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.39.self_attn.v_proj.bias": "model-00040-of-00092.safetensors", + "model.layers.39.self_attn.v_proj.weight": "model-00040-of-00092.safetensors", + "model.layers.39.self_attn.v_proj.weight_scale": "model-00040-of-00092.safetensors", + "model.layers.40.input_layernorm.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.0.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.0.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.0.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.0.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.0.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.0.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.1.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.1.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.1.gate_proj.weight": "model-00041-of-00092.safetensors", + 
"model.layers.40.mlp.experts.1.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.1.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.1.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.10.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.10.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.10.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.10.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.10.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.10.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.100.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.100.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.100.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.100.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.100.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.100.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.101.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.101.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.101.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.101.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.101.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.101.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.102.down_proj.weight": 
"model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.102.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.102.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.102.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.102.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.102.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.103.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.103.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.103.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.103.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.103.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.103.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.104.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.104.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.104.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.104.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.104.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.104.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.105.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.105.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.105.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.105.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + 
"model.layers.40.mlp.experts.105.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.105.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.106.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.106.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.106.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.106.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.106.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.106.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.107.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.107.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.107.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.107.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.107.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.107.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.108.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.108.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.108.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.108.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.108.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.108.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.109.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.109.down_proj.weight_scale": 
"model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.109.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.109.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.109.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.109.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.11.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.11.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.11.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.11.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.11.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.11.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.110.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.110.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.110.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.110.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.110.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.110.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.111.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.111.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.111.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.111.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.111.up_proj.weight": "model-00041-of-00092.safetensors", + 
"model.layers.40.mlp.experts.111.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.112.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.112.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.112.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.112.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.112.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.112.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.113.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.113.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.113.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.113.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.113.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.113.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.114.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.114.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.114.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.114.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.114.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.114.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.115.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.115.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.115.gate_proj.weight": 
"model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.115.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.115.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.115.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.116.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.116.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.116.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.116.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.116.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.116.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.117.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.117.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.117.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.117.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.117.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.117.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.118.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.118.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.118.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.118.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.118.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.118.up_proj.weight_scale": "model-00041-of-00092.safetensors", + 
"model.layers.40.mlp.experts.119.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.119.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.119.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.119.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.119.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.119.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.12.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.12.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.12.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.12.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.12.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.12.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.120.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.120.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.120.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.120.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.120.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.120.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.121.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.121.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.121.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.121.gate_proj.weight_scale": 
"model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.121.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.121.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.122.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.122.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.122.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.122.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.122.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.122.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.123.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.123.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.123.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.123.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.123.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.123.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.124.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.124.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.124.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.124.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.124.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.124.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.125.down_proj.weight": "model-00041-of-00092.safetensors", + 
"model.layers.40.mlp.experts.125.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.125.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.125.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.125.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.125.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.126.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.126.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.126.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.126.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.126.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.126.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.127.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.127.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.127.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.127.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.127.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.127.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.128.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.128.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.128.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.128.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.128.up_proj.weight": 
"model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.128.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.129.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.129.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.129.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.129.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.129.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.129.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.13.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.13.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.13.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.13.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.13.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.13.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.130.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.130.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.130.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.130.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.130.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.130.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.131.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.131.down_proj.weight_scale": "model-00041-of-00092.safetensors", + 
"model.layers.40.mlp.experts.131.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.131.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.131.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.131.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.132.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.132.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.132.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.132.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.132.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.132.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.133.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.133.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.133.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.133.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.133.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.133.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.134.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.134.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.134.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.134.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.134.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.134.up_proj.weight_scale": 
"model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.135.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.135.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.135.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.135.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.135.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.135.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.136.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.136.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.136.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.136.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.136.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.136.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.137.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.137.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.137.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.137.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.137.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.137.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.138.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.138.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.138.gate_proj.weight": "model-00041-of-00092.safetensors", + 
"model.layers.40.mlp.experts.138.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.138.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.138.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.139.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.139.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.139.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.139.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.139.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.139.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.14.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.14.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.14.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.14.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.14.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.14.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.140.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.140.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.140.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.140.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.140.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.140.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.141.down_proj.weight": 
"model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.141.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.141.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.141.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.141.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.141.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.142.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.142.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.142.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.142.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.142.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.142.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.143.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.143.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.143.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.143.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.143.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.143.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.144.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.144.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.144.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.144.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + 
"model.layers.40.mlp.experts.144.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.144.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.145.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.145.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.145.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.145.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.145.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.145.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.146.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.146.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.146.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.146.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.146.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.146.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.147.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.147.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.147.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.147.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.147.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.147.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.148.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.148.down_proj.weight_scale": 
"model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.148.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.148.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.148.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.148.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.149.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.149.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.149.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.149.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.149.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.149.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.15.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.15.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.15.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.15.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.15.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.15.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.150.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.150.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.150.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.150.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.150.up_proj.weight": "model-00041-of-00092.safetensors", + 
"model.layers.40.mlp.experts.150.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.151.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.151.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.151.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.151.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.151.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.151.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.152.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.152.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.152.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.152.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.152.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.152.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.153.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.153.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.153.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.153.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.153.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.153.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.154.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.154.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.154.gate_proj.weight": 
"model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.154.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.154.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.154.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.155.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.155.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.155.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.155.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.155.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.155.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.156.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.156.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.156.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.156.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.156.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.156.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.157.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.157.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.157.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.157.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.157.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.157.up_proj.weight_scale": "model-00041-of-00092.safetensors", + 
"model.layers.40.mlp.experts.158.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.158.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.158.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.158.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.158.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.158.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.159.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.159.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.159.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.159.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.159.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.159.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.16.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.16.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.16.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.16.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.16.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.16.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.17.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.17.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.17.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.17.gate_proj.weight_scale": 
"model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.17.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.17.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.18.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.18.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.18.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.18.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.18.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.18.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.19.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.19.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.19.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.19.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.19.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.19.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.2.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.2.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.2.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.2.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.2.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.2.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.20.down_proj.weight": "model-00041-of-00092.safetensors", + 
"model.layers.40.mlp.experts.20.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.20.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.20.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.20.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.20.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.21.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.21.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.21.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.21.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.21.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.21.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.22.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.22.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.22.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.22.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.22.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.22.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.23.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.23.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.23.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.23.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.23.up_proj.weight": 
"model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.23.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.24.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.24.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.24.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.24.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.24.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.24.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.25.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.25.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.25.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.25.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.25.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.25.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.26.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.26.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.26.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.26.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.26.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.26.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.27.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.27.down_proj.weight_scale": "model-00041-of-00092.safetensors", + 
"model.layers.40.mlp.experts.27.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.27.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.27.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.27.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.28.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.28.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.28.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.28.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.28.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.28.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.29.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.29.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.29.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.29.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.29.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.29.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.3.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.3.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.3.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.3.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.3.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.3.up_proj.weight_scale": "model-00041-of-00092.safetensors", 
+ "model.layers.40.mlp.experts.30.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.30.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.30.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.30.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.30.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.30.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.31.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.31.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.31.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.31.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.31.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.31.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.32.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.32.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.32.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.32.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.32.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.32.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.33.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.33.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.33.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.33.gate_proj.weight_scale": 
"model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.33.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.33.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.34.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.34.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.34.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.34.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.34.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.34.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.35.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.35.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.35.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.35.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.35.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.35.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.36.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.36.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.36.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.36.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.36.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.36.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.37.down_proj.weight": "model-00041-of-00092.safetensors", + 
"model.layers.40.mlp.experts.37.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.37.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.37.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.37.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.37.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.38.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.38.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.38.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.38.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.38.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.38.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.39.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.39.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.39.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.39.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.39.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.39.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.4.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.4.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.4.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.4.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.4.up_proj.weight": 
"model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.4.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.40.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.40.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.40.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.40.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.40.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.40.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.41.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.41.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.41.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.41.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.41.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.41.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.42.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.42.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.42.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.42.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.42.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.42.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.43.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.43.down_proj.weight_scale": "model-00041-of-00092.safetensors", + 
"model.layers.40.mlp.experts.43.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.43.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.43.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.43.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.44.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.44.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.44.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.44.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.44.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.44.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.45.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.45.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.45.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.45.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.45.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.45.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.46.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.46.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.46.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.46.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.46.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.46.up_proj.weight_scale": 
"model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.47.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.47.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.47.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.47.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.47.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.47.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.48.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.48.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.48.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.48.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.48.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.48.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.49.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.49.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.49.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.49.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.49.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.49.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.5.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.5.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.5.gate_proj.weight": "model-00041-of-00092.safetensors", + 
"model.layers.40.mlp.experts.5.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.5.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.5.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.50.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.50.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.50.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.50.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.50.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.50.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.51.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.51.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.51.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.51.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.51.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.51.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.52.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.52.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.52.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.52.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.52.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.52.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.53.down_proj.weight": 
"model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.53.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.53.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.53.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.53.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.53.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.54.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.54.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.54.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.54.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.54.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.54.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.55.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.55.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.55.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.55.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.55.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.55.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.56.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.56.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.56.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.56.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + 
"model.layers.40.mlp.experts.56.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.56.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.57.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.57.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.57.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.57.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.57.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.57.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.58.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.58.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.58.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.58.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.58.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.58.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.59.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.59.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.59.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.59.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.59.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.59.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.6.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.6.down_proj.weight_scale": 
"model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.6.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.6.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.6.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.6.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.60.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.60.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.60.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.60.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.60.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.60.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.61.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.61.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.61.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.61.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.61.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.61.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.62.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.62.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.62.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.62.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.62.up_proj.weight": "model-00041-of-00092.safetensors", + 
"model.layers.40.mlp.experts.62.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.63.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.63.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.63.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.63.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.63.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.63.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.64.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.64.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.64.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.64.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.64.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.64.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.65.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.65.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.65.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.65.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.65.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.65.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.66.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.66.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.66.gate_proj.weight": 
"model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.66.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.66.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.66.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.67.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.67.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.67.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.67.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.67.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.67.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.68.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.68.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.68.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.68.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.68.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.68.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.69.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.69.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.69.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.69.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.69.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.69.up_proj.weight_scale": "model-00041-of-00092.safetensors", + 
"model.layers.40.mlp.experts.7.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.7.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.7.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.7.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.7.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.7.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.70.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.70.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.70.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.70.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.70.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.70.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.71.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.71.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.71.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.71.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.71.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.71.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.72.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.72.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.72.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.72.gate_proj.weight_scale": 
"model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.72.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.72.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.73.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.73.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.73.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.73.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.73.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.73.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.74.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.74.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.74.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.74.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.74.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.74.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.75.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.75.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.75.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.75.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.75.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.75.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.76.down_proj.weight": "model-00041-of-00092.safetensors", + 
"model.layers.40.mlp.experts.76.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.76.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.76.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.76.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.76.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.77.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.77.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.77.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.77.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.77.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.77.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.78.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.78.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.78.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.78.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.78.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.78.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.79.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.79.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.79.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.79.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.79.up_proj.weight": 
"model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.79.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.8.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.8.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.8.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.8.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.8.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.8.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.80.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.80.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.80.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.80.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.80.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.80.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.81.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.81.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.81.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.81.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.81.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.81.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.82.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.82.down_proj.weight_scale": "model-00041-of-00092.safetensors", + 
"model.layers.40.mlp.experts.82.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.82.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.82.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.82.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.83.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.83.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.83.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.83.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.83.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.83.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.84.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.84.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.84.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.84.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.84.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.84.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.85.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.85.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.85.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.85.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.85.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.85.up_proj.weight_scale": 
"model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.86.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.86.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.86.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.86.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.86.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.86.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.87.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.87.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.87.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.87.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.87.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.87.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.88.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.88.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.88.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.88.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.88.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.88.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.89.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.89.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.89.gate_proj.weight": "model-00041-of-00092.safetensors", + 
"model.layers.40.mlp.experts.89.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.89.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.89.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.9.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.9.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.9.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.9.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.9.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.9.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.90.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.90.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.90.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.90.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.90.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.90.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.91.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.91.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.91.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.91.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.91.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.91.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.92.down_proj.weight": "model-00041-of-00092.safetensors", 
+ "model.layers.40.mlp.experts.92.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.92.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.92.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.92.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.92.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.93.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.93.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.93.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.93.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.93.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.93.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.94.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.94.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.94.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.94.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.94.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.94.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.95.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.95.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.95.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.95.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.95.up_proj.weight": 
"model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.95.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.96.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.96.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.96.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.96.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.96.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.96.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.97.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.97.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.97.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.97.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.97.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.97.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.98.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.98.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.98.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.98.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.98.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.98.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.99.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.99.down_proj.weight_scale": "model-00041-of-00092.safetensors", + 
"model.layers.40.mlp.experts.99.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.99.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.99.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.experts.99.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.gate.e_score_correction_bias": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.gate.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.shared_experts.down_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.shared_experts.down_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.shared_experts.gate_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.shared_experts.gate_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.shared_experts.up_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.mlp.shared_experts.up_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.post_attention_layernorm.weight": "model-00041-of-00092.safetensors", + "model.layers.40.self_attn.k_norm.weight": "model-00041-of-00092.safetensors", + "model.layers.40.self_attn.k_proj.bias": "model-00041-of-00092.safetensors", + "model.layers.40.self_attn.k_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.self_attn.k_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.self_attn.o_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.self_attn.o_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.40.self_attn.q_norm.weight": "model-00041-of-00092.safetensors", + "model.layers.40.self_attn.q_proj.bias": "model-00041-of-00092.safetensors", + "model.layers.40.self_attn.q_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.self_attn.q_proj.weight_scale": 
"model-00041-of-00092.safetensors", + "model.layers.40.self_attn.v_proj.bias": "model-00041-of-00092.safetensors", + "model.layers.40.self_attn.v_proj.weight": "model-00041-of-00092.safetensors", + "model.layers.40.self_attn.v_proj.weight_scale": "model-00041-of-00092.safetensors", + "model.layers.41.input_layernorm.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.0.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.0.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.0.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.0.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.0.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.0.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.1.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.1.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.1.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.1.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.1.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.1.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.10.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.10.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.10.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.10.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.10.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.10.up_proj.weight_scale": "model-00042-of-00092.safetensors", + 
"model.layers.41.mlp.experts.100.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.100.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.100.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.100.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.100.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.100.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.101.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.101.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.101.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.101.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.101.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.101.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.102.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.102.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.102.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.102.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.102.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.102.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.103.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.103.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.103.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.103.gate_proj.weight_scale": 
"model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.103.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.103.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.104.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.104.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.104.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.104.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.104.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.104.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.105.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.105.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.105.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.105.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.105.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.105.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.106.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.106.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.106.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.106.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.106.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.106.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.107.down_proj.weight": "model-00042-of-00092.safetensors", + 
"model.layers.41.mlp.experts.107.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.107.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.107.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.107.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.107.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.108.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.108.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.108.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.108.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.108.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.108.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.109.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.109.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.109.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.109.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.109.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.109.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.11.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.11.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.11.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.11.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.11.up_proj.weight": 
"model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.11.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.110.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.110.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.110.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.110.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.110.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.110.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.111.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.111.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.111.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.111.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.111.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.111.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.112.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.112.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.112.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.112.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.112.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.112.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.113.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.113.down_proj.weight_scale": "model-00042-of-00092.safetensors", + 
"model.layers.41.mlp.experts.113.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.113.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.113.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.113.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.114.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.114.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.114.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.114.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.114.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.114.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.115.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.115.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.115.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.115.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.115.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.115.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.116.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.116.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.116.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.116.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.116.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.116.up_proj.weight_scale": 
"model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.117.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.117.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.117.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.117.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.117.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.117.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.118.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.118.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.118.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.118.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.118.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.118.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.119.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.119.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.119.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.119.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.119.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.119.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.12.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.12.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.12.gate_proj.weight": "model-00042-of-00092.safetensors", + 
"model.layers.41.mlp.experts.12.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.12.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.12.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.120.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.120.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.120.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.120.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.120.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.120.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.121.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.121.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.121.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.121.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.121.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.121.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.122.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.122.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.122.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.122.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.122.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.122.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.123.down_proj.weight": 
"model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.123.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.123.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.123.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.123.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.123.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.124.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.124.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.124.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.124.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.124.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.124.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.125.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.125.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.125.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.125.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.125.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.125.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.126.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.126.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.126.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.126.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + 
"model.layers.41.mlp.experts.126.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.126.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.127.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.127.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.127.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.127.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.127.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.127.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.128.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.128.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.128.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.128.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.128.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.128.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.129.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.129.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.129.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.129.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.129.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.129.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.13.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.13.down_proj.weight_scale": 
"model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.13.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.13.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.13.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.13.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.130.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.130.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.130.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.130.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.130.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.130.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.131.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.131.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.131.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.131.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.131.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.131.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.132.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.132.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.132.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.132.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.132.up_proj.weight": "model-00042-of-00092.safetensors", + 
"model.layers.41.mlp.experts.132.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.133.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.133.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.133.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.133.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.133.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.133.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.134.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.134.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.134.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.134.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.134.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.134.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.135.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.135.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.135.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.135.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.135.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.135.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.136.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.136.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.136.gate_proj.weight": 
"model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.136.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.136.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.136.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.137.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.137.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.137.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.137.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.137.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.137.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.138.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.138.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.138.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.138.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.138.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.138.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.139.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.139.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.139.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.139.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.139.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.139.up_proj.weight_scale": "model-00042-of-00092.safetensors", + 
"model.layers.41.mlp.experts.14.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.14.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.14.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.14.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.14.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.14.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.140.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.140.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.140.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.140.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.140.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.140.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.141.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.141.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.141.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.141.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.141.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.141.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.142.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.142.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.142.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.142.gate_proj.weight_scale": 
"model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.142.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.142.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.143.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.143.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.143.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.143.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.143.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.143.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.144.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.144.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.144.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.144.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.144.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.144.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.145.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.145.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.145.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.145.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.145.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.145.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.146.down_proj.weight": "model-00042-of-00092.safetensors", + 
"model.layers.41.mlp.experts.146.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.146.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.146.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.146.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.146.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.147.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.147.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.147.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.147.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.147.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.147.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.148.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.148.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.148.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.148.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.148.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.148.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.149.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.149.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.149.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.149.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.149.up_proj.weight": 
"model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.149.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.15.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.15.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.15.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.15.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.15.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.15.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.150.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.150.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.150.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.150.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.150.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.150.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.151.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.151.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.151.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.151.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.151.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.151.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.152.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.152.down_proj.weight_scale": "model-00042-of-00092.safetensors", + 
"model.layers.41.mlp.experts.152.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.152.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.152.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.152.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.153.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.153.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.153.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.153.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.153.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.153.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.154.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.154.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.154.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.154.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.154.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.154.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.155.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.155.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.155.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.155.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.155.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.155.up_proj.weight_scale": 
"model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.156.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.156.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.156.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.156.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.156.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.156.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.157.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.157.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.157.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.157.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.157.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.157.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.158.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.158.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.158.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.158.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.158.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.158.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.159.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.159.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.159.gate_proj.weight": "model-00042-of-00092.safetensors", + 
"model.layers.41.mlp.experts.159.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.159.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.159.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.16.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.16.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.16.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.16.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.16.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.16.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.17.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.17.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.17.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.17.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.17.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.17.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.18.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.18.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.18.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.18.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.18.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.18.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.19.down_proj.weight": 
"model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.19.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.19.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.19.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.19.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.19.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.2.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.2.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.2.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.2.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.2.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.2.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.20.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.20.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.20.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.20.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.20.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.20.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.21.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.21.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.21.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.21.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + 
"model.layers.41.mlp.experts.21.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.21.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.22.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.22.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.22.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.22.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.22.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.22.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.23.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.23.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.23.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.23.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.23.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.23.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.24.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.24.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.24.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.24.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.24.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.24.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.25.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.25.down_proj.weight_scale": 
"model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.25.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.25.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.25.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.25.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.26.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.26.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.26.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.26.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.26.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.26.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.27.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.27.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.27.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.27.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.27.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.27.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.28.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.28.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.28.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.28.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.28.up_proj.weight": "model-00042-of-00092.safetensors", + 
"model.layers.41.mlp.experts.28.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.29.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.29.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.29.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.29.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.29.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.29.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.3.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.3.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.3.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.3.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.3.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.3.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.30.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.30.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.30.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.30.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.30.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.30.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.31.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.31.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.31.gate_proj.weight": 
"model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.31.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.31.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.31.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.32.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.32.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.32.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.32.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.32.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.32.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.33.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.33.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.33.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.33.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.33.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.33.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.34.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.34.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.34.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.34.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.34.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.34.up_proj.weight_scale": "model-00042-of-00092.safetensors", + 
"model.layers.41.mlp.experts.35.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.35.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.35.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.35.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.35.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.35.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.36.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.36.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.36.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.36.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.36.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.36.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.37.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.37.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.37.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.37.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.37.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.37.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.38.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.38.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.38.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.38.gate_proj.weight_scale": 
"model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.38.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.38.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.39.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.39.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.39.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.39.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.39.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.39.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.4.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.4.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.4.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.4.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.4.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.4.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.40.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.40.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.40.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.40.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.40.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.40.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.41.down_proj.weight": "model-00042-of-00092.safetensors", + 
"model.layers.41.mlp.experts.41.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.41.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.41.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.41.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.41.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.42.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.42.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.42.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.42.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.42.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.42.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.43.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.43.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.43.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.43.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.43.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.43.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.44.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.44.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.44.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.44.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.44.up_proj.weight": 
"model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.44.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.45.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.45.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.45.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.45.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.45.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.45.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.46.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.46.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.46.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.46.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.46.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.46.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.47.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.47.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.47.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.47.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.47.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.47.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.48.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.48.down_proj.weight_scale": "model-00042-of-00092.safetensors", + 
"model.layers.41.mlp.experts.48.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.48.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.48.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.48.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.49.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.49.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.49.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.49.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.49.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.49.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.5.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.5.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.5.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.5.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.5.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.5.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.50.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.50.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.50.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.50.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.50.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.50.up_proj.weight_scale": "model-00042-of-00092.safetensors", 
+ "model.layers.41.mlp.experts.51.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.51.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.51.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.51.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.51.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.51.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.52.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.52.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.52.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.52.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.52.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.52.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.53.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.53.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.53.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.53.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.53.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.53.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.54.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.54.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.54.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.54.gate_proj.weight_scale": 
"model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.54.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.54.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.55.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.55.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.55.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.55.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.55.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.55.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.56.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.56.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.56.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.56.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.56.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.56.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.57.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.57.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.57.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.57.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.57.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.57.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.58.down_proj.weight": "model-00042-of-00092.safetensors", + 
"model.layers.41.mlp.experts.58.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.58.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.58.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.58.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.58.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.59.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.59.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.59.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.59.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.59.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.59.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.6.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.6.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.6.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.6.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.6.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.6.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.60.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.60.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.60.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.60.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.60.up_proj.weight": 
"model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.60.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.61.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.61.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.61.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.61.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.61.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.61.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.62.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.62.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.62.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.62.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.62.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.62.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.63.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.63.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.63.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.63.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.63.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.63.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.64.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.64.down_proj.weight_scale": "model-00042-of-00092.safetensors", + 
"model.layers.41.mlp.experts.64.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.64.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.64.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.64.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.65.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.65.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.65.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.65.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.65.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.65.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.66.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.66.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.66.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.66.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.66.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.66.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.67.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.67.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.67.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.67.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.67.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.67.up_proj.weight_scale": 
"model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.68.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.68.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.68.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.68.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.68.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.68.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.69.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.69.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.69.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.69.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.69.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.69.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.7.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.7.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.7.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.7.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.7.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.7.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.70.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.70.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.70.gate_proj.weight": "model-00042-of-00092.safetensors", + 
"model.layers.41.mlp.experts.70.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.70.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.70.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.71.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.71.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.71.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.71.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.71.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.71.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.72.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.72.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.72.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.72.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.72.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.72.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.73.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.73.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.73.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.73.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.73.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.73.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.74.down_proj.weight": 
"model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.74.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.74.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.74.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.74.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.74.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.75.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.75.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.75.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.75.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.75.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.75.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.76.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.76.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.76.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.76.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.76.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.76.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.77.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.77.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.77.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.77.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + 
"model.layers.41.mlp.experts.77.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.77.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.78.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.78.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.78.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.78.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.78.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.78.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.79.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.79.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.79.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.79.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.79.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.79.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.8.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.8.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.8.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.8.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.8.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.8.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.80.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.80.down_proj.weight_scale": "model-00042-of-00092.safetensors", 
+ "model.layers.41.mlp.experts.80.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.80.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.80.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.80.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.81.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.81.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.81.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.81.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.81.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.81.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.82.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.82.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.82.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.82.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.82.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.82.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.83.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.83.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.83.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.83.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.83.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.83.up_proj.weight_scale": 
"model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.84.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.84.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.84.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.84.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.84.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.84.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.85.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.85.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.85.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.85.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.85.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.85.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.86.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.86.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.86.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.86.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.86.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.86.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.87.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.87.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.87.gate_proj.weight": "model-00042-of-00092.safetensors", + 
"model.layers.41.mlp.experts.87.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.87.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.87.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.88.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.88.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.88.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.88.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.88.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.88.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.89.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.89.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.89.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.89.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.89.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.89.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.9.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.9.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.9.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.9.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.9.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.9.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.90.down_proj.weight": "model-00042-of-00092.safetensors", 
+ "model.layers.41.mlp.experts.90.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.90.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.90.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.90.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.90.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.91.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.91.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.91.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.91.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.91.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.91.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.92.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.92.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.92.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.92.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.92.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.92.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.93.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.93.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.93.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.93.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.93.up_proj.weight": 
"model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.93.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.94.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.94.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.94.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.94.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.94.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.94.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.95.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.95.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.95.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.95.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.95.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.95.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.96.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.96.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.96.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.96.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.96.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.96.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.97.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.97.down_proj.weight_scale": "model-00042-of-00092.safetensors", + 
"model.layers.41.mlp.experts.97.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.97.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.97.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.97.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.98.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.98.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.98.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.98.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.98.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.98.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.99.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.99.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.99.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.99.gate_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.99.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.experts.99.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.gate.e_score_correction_bias": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.gate.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.shared_experts.down_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.shared_experts.down_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.shared_experts.gate_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.shared_experts.gate_proj.weight_scale": 
"model-00042-of-00092.safetensors", + "model.layers.41.mlp.shared_experts.up_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.mlp.shared_experts.up_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.post_attention_layernorm.weight": "model-00042-of-00092.safetensors", + "model.layers.41.self_attn.k_norm.weight": "model-00042-of-00092.safetensors", + "model.layers.41.self_attn.k_proj.bias": "model-00042-of-00092.safetensors", + "model.layers.41.self_attn.k_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.self_attn.k_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.self_attn.o_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.self_attn.o_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.self_attn.q_norm.weight": "model-00042-of-00092.safetensors", + "model.layers.41.self_attn.q_proj.bias": "model-00042-of-00092.safetensors", + "model.layers.41.self_attn.q_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.self_attn.q_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.41.self_attn.v_proj.bias": "model-00042-of-00092.safetensors", + "model.layers.41.self_attn.v_proj.weight": "model-00042-of-00092.safetensors", + "model.layers.41.self_attn.v_proj.weight_scale": "model-00042-of-00092.safetensors", + "model.layers.42.input_layernorm.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.0.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.0.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.0.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.0.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.0.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.0.up_proj.weight_scale": 
"model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.1.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.1.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.1.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.1.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.1.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.1.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.10.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.10.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.10.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.10.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.10.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.10.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.100.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.100.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.100.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.100.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.100.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.100.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.101.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.101.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.101.gate_proj.weight": "model-00043-of-00092.safetensors", + 
"model.layers.42.mlp.experts.101.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.101.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.101.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.102.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.102.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.102.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.102.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.102.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.102.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.103.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.103.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.103.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.103.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.103.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.103.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.104.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.104.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.104.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.104.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.104.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.104.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.105.down_proj.weight": 
"model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.105.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.105.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.105.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.105.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.105.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.106.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.106.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.106.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.106.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.106.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.106.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.107.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.107.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.107.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.107.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.107.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.107.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.108.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.108.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.108.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.108.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + 
"model.layers.42.mlp.experts.108.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.108.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.109.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.109.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.109.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.109.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.109.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.109.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.11.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.11.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.11.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.11.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.11.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.11.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.110.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.110.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.110.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.110.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.110.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.110.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.111.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.111.down_proj.weight_scale": 
"model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.111.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.111.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.111.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.111.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.112.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.112.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.112.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.112.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.112.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.112.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.113.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.113.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.113.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.113.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.113.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.113.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.114.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.114.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.114.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.114.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.114.up_proj.weight": "model-00043-of-00092.safetensors", + 
"model.layers.42.mlp.experts.114.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.115.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.115.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.115.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.115.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.115.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.115.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.116.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.116.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.116.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.116.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.116.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.116.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.117.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.117.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.117.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.117.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.117.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.117.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.118.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.118.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.118.gate_proj.weight": 
"model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.118.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.118.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.118.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.119.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.119.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.119.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.119.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.119.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.119.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.12.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.12.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.12.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.12.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.12.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.12.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.120.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.120.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.120.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.120.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.120.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.120.up_proj.weight_scale": "model-00043-of-00092.safetensors", + 
"model.layers.42.mlp.experts.121.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.121.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.121.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.121.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.121.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.121.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.122.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.122.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.122.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.122.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.122.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.122.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.123.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.123.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.123.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.123.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.123.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.123.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.124.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.124.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.124.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.124.gate_proj.weight_scale": 
"model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.124.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.124.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.125.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.125.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.125.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.125.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.125.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.125.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.126.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.126.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.126.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.126.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.126.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.126.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.127.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.127.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.127.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.127.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.127.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.127.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.128.down_proj.weight": "model-00043-of-00092.safetensors", + 
"model.layers.42.mlp.experts.128.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.128.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.128.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.128.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.128.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.129.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.129.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.129.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.129.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.129.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.129.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.13.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.13.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.13.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.13.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.13.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.13.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.130.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.130.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.130.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.130.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.130.up_proj.weight": 
"model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.130.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.131.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.131.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.131.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.131.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.131.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.131.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.132.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.132.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.132.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.132.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.132.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.132.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.133.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.133.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.133.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.133.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.133.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.133.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.134.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.134.down_proj.weight_scale": "model-00043-of-00092.safetensors", + 
"model.layers.42.mlp.experts.134.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.134.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.134.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.134.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.135.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.135.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.135.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.135.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.135.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.135.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.136.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.136.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.136.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.136.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.136.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.136.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.137.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.137.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.137.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.137.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.137.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.137.up_proj.weight_scale": 
"model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.138.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.138.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.138.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.138.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.138.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.138.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.139.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.139.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.139.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.139.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.139.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.139.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.14.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.14.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.14.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.14.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.14.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.14.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.140.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.140.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.140.gate_proj.weight": "model-00043-of-00092.safetensors", + 
"model.layers.42.mlp.experts.140.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.140.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.140.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.141.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.141.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.141.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.141.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.141.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.141.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.142.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.142.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.142.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.142.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.142.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.142.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.143.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.143.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.143.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.143.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.143.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.143.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.144.down_proj.weight": 
"model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.144.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.144.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.144.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.144.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.144.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.145.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.145.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.145.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.145.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.145.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.145.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.146.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.146.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.146.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.146.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.146.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.146.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.147.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.147.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.147.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.147.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + 
"model.layers.42.mlp.experts.147.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.147.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.148.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.148.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.148.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.148.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.148.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.148.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.149.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.149.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.149.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.149.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.149.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.149.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.15.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.15.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.15.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.15.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.15.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.15.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.150.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.150.down_proj.weight_scale": 
"model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.150.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.150.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.150.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.150.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.151.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.151.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.151.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.151.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.151.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.151.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.152.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.152.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.152.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.152.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.152.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.152.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.153.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.153.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.153.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.153.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.153.up_proj.weight": "model-00043-of-00092.safetensors", + 
"model.layers.42.mlp.experts.153.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.154.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.154.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.154.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.154.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.154.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.154.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.155.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.155.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.155.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.155.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.155.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.155.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.156.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.156.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.156.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.156.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.156.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.156.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.157.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.157.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.157.gate_proj.weight": 
"model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.157.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.157.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.157.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.158.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.158.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.158.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.158.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.158.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.158.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.159.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.159.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.159.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.159.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.159.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.159.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.16.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.16.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.16.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.16.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.16.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.16.up_proj.weight_scale": "model-00043-of-00092.safetensors", + 
"model.layers.42.mlp.experts.17.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.17.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.17.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.17.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.17.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.17.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.18.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.18.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.18.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.18.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.18.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.18.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.19.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.19.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.19.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.19.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.19.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.19.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.2.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.2.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.2.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.2.gate_proj.weight_scale": 
"model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.2.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.2.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.20.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.20.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.20.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.20.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.20.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.20.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.21.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.21.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.21.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.21.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.21.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.21.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.22.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.22.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.22.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.22.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.22.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.22.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.23.down_proj.weight": "model-00043-of-00092.safetensors", + 
"model.layers.42.mlp.experts.23.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.23.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.23.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.23.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.23.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.24.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.24.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.24.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.24.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.24.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.24.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.25.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.25.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.25.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.25.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.25.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.25.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.26.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.26.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.26.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.26.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.26.up_proj.weight": 
"model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.26.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.27.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.27.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.27.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.27.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.27.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.27.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.28.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.28.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.28.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.28.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.28.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.28.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.29.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.29.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.29.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.29.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.29.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.29.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.3.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.3.down_proj.weight_scale": "model-00043-of-00092.safetensors", + 
"model.layers.42.mlp.experts.3.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.3.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.3.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.3.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.30.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.30.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.30.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.30.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.30.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.30.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.31.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.31.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.31.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.31.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.31.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.31.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.32.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.32.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.32.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.32.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.32.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.32.up_proj.weight_scale": 
"model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.33.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.33.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.33.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.33.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.33.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.33.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.34.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.34.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.34.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.34.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.34.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.34.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.35.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.35.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.35.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.35.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.35.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.35.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.36.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.36.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.36.gate_proj.weight": "model-00043-of-00092.safetensors", + 
"model.layers.42.mlp.experts.36.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.36.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.36.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.37.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.37.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.37.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.37.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.37.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.37.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.38.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.38.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.38.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.38.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.38.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.38.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.39.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.39.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.39.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.39.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.39.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.39.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.4.down_proj.weight": 
"model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.4.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.4.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.4.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.4.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.4.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.40.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.40.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.40.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.40.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.40.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.40.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.41.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.41.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.41.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.41.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.41.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.41.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.42.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.42.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.42.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.42.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + 
"model.layers.42.mlp.experts.42.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.42.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.43.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.43.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.43.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.43.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.43.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.43.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.44.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.44.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.44.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.44.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.44.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.44.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.45.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.45.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.45.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.45.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.45.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.45.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.46.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.46.down_proj.weight_scale": 
"model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.46.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.46.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.46.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.46.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.47.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.47.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.47.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.47.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.47.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.47.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.48.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.48.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.48.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.48.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.48.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.48.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.49.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.49.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.49.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.49.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.49.up_proj.weight": "model-00043-of-00092.safetensors", + 
"model.layers.42.mlp.experts.49.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.5.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.5.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.5.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.5.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.5.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.5.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.50.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.50.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.50.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.50.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.50.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.50.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.51.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.51.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.51.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.51.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.51.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.51.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.52.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.52.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.52.gate_proj.weight": 
"model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.52.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.52.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.52.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.53.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.53.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.53.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.53.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.53.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.53.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.54.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.54.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.54.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.54.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.54.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.54.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.55.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.55.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.55.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.55.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.55.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.55.up_proj.weight_scale": "model-00043-of-00092.safetensors", + 
"model.layers.42.mlp.experts.56.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.56.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.56.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.56.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.56.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.56.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.57.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.57.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.57.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.57.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.57.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.57.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.58.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.58.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.58.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.58.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.58.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.58.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.59.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.59.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.59.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.59.gate_proj.weight_scale": 
"model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.59.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.59.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.6.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.6.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.6.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.6.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.6.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.6.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.60.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.60.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.60.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.60.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.60.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.60.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.61.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.61.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.61.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.61.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.61.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.61.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.62.down_proj.weight": "model-00043-of-00092.safetensors", + 
"model.layers.42.mlp.experts.62.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.62.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.62.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.62.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.62.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.63.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.63.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.63.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.63.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.63.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.63.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.64.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.64.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.64.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.64.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.64.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.64.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.65.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.65.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.65.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.65.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.65.up_proj.weight": 
"model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.65.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.66.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.66.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.66.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.66.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.66.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.66.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.67.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.67.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.67.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.67.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.67.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.67.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.68.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.68.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.68.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.68.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.68.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.68.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.69.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.69.down_proj.weight_scale": "model-00043-of-00092.safetensors", + 
"model.layers.42.mlp.experts.69.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.69.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.69.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.69.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.7.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.7.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.7.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.7.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.7.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.7.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.70.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.70.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.70.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.70.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.70.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.70.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.71.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.71.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.71.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.71.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.71.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.71.up_proj.weight_scale": "model-00043-of-00092.safetensors", 
+ "model.layers.42.mlp.experts.72.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.72.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.72.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.72.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.72.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.72.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.73.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.73.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.73.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.73.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.73.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.73.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.74.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.74.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.74.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.74.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.74.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.74.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.75.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.75.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.75.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.75.gate_proj.weight_scale": 
"model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.75.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.75.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.76.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.76.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.76.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.76.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.76.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.76.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.77.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.77.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.77.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.77.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.77.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.77.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.78.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.78.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.78.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.78.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.78.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.78.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.79.down_proj.weight": "model-00043-of-00092.safetensors", + 
"model.layers.42.mlp.experts.79.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.79.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.79.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.79.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.79.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.8.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.8.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.8.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.8.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.8.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.8.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.80.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.80.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.80.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.80.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.80.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.80.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.81.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.81.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.81.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.81.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.81.up_proj.weight": 
"model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.81.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.82.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.82.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.82.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.82.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.82.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.82.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.83.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.83.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.83.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.83.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.83.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.83.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.84.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.84.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.84.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.84.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.84.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.84.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.85.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.85.down_proj.weight_scale": "model-00043-of-00092.safetensors", + 
"model.layers.42.mlp.experts.85.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.85.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.85.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.85.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.86.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.86.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.86.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.86.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.86.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.86.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.87.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.87.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.87.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.87.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.87.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.87.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.88.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.88.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.88.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.88.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.88.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.88.up_proj.weight_scale": 
"model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.89.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.89.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.89.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.89.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.89.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.89.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.9.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.9.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.9.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.9.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.9.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.9.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.90.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.90.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.90.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.90.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.90.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.90.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.91.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.91.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.91.gate_proj.weight": "model-00043-of-00092.safetensors", + 
"model.layers.42.mlp.experts.91.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.91.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.91.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.92.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.92.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.92.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.92.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.92.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.92.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.93.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.93.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.93.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.93.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.93.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.93.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.94.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.94.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.94.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.94.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.94.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.94.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.95.down_proj.weight": 
"model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.95.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.95.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.95.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.95.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.95.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.96.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.96.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.96.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.96.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.96.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.96.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.97.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.97.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.97.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.97.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.97.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.97.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.98.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.98.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.98.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.98.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + 
"model.layers.42.mlp.experts.98.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.98.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.99.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.99.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.99.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.99.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.99.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.experts.99.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.gate.e_score_correction_bias": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.gate.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.shared_experts.down_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.shared_experts.down_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.shared_experts.gate_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.shared_experts.gate_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.shared_experts.up_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.mlp.shared_experts.up_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.post_attention_layernorm.weight": "model-00043-of-00092.safetensors", + "model.layers.42.self_attn.k_norm.weight": "model-00043-of-00092.safetensors", + "model.layers.42.self_attn.k_proj.bias": "model-00043-of-00092.safetensors", + "model.layers.42.self_attn.k_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.self_attn.k_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.self_attn.o_proj.weight": "model-00043-of-00092.safetensors", + 
"model.layers.42.self_attn.o_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.self_attn.q_norm.weight": "model-00043-of-00092.safetensors", + "model.layers.42.self_attn.q_proj.bias": "model-00043-of-00092.safetensors", + "model.layers.42.self_attn.q_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.self_attn.q_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.42.self_attn.v_proj.bias": "model-00043-of-00092.safetensors", + "model.layers.42.self_attn.v_proj.weight": "model-00043-of-00092.safetensors", + "model.layers.42.self_attn.v_proj.weight_scale": "model-00043-of-00092.safetensors", + "model.layers.43.input_layernorm.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.0.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.0.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.0.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.0.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.0.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.0.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.1.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.1.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.1.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.1.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.1.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.1.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.10.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.10.down_proj.weight_scale": 
"model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.10.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.10.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.10.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.10.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.100.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.100.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.100.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.100.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.100.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.100.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.101.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.101.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.101.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.101.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.101.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.101.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.102.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.102.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.102.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.102.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.102.up_proj.weight": "model-00044-of-00092.safetensors", + 
"model.layers.43.mlp.experts.102.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.103.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.103.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.103.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.103.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.103.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.103.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.104.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.104.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.104.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.104.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.104.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.104.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.105.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.105.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.105.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.105.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.105.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.105.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.106.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.106.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.106.gate_proj.weight": 
"model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.106.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.106.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.106.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.107.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.107.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.107.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.107.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.107.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.107.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.108.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.108.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.108.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.108.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.108.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.108.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.109.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.109.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.109.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.109.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.109.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.109.up_proj.weight_scale": "model-00044-of-00092.safetensors", + 
"model.layers.43.mlp.experts.11.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.11.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.11.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.11.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.11.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.11.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.110.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.110.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.110.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.110.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.110.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.110.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.111.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.111.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.111.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.111.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.111.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.111.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.112.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.112.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.112.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.112.gate_proj.weight_scale": 
"model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.112.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.112.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.113.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.113.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.113.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.113.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.113.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.113.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.114.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.114.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.114.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.114.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.114.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.114.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.115.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.115.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.115.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.115.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.115.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.115.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.116.down_proj.weight": "model-00044-of-00092.safetensors", + 
"model.layers.43.mlp.experts.116.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.116.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.116.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.116.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.116.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.117.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.117.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.117.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.117.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.117.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.117.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.118.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.118.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.118.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.118.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.118.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.118.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.119.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.119.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.119.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.119.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.119.up_proj.weight": 
"model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.119.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.12.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.12.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.12.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.12.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.12.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.12.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.120.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.120.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.120.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.120.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.120.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.120.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.121.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.121.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.121.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.121.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.121.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.121.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.122.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.122.down_proj.weight_scale": "model-00044-of-00092.safetensors", + 
"model.layers.43.mlp.experts.122.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.122.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.122.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.122.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.123.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.123.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.123.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.123.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.123.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.123.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.124.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.124.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.124.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.124.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.124.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.124.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.125.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.125.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.125.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.125.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.125.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.125.up_proj.weight_scale": 
"model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.126.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.126.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.126.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.126.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.126.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.126.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.127.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.127.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.127.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.127.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.127.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.127.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.128.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.128.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.128.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.128.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.128.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.128.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.129.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.129.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.129.gate_proj.weight": "model-00044-of-00092.safetensors", + 
"model.layers.43.mlp.experts.129.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.129.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.129.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.13.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.13.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.13.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.13.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.13.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.13.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.130.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.130.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.130.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.130.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.130.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.130.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.131.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.131.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.131.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.131.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.131.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.131.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.132.down_proj.weight": 
"model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.132.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.132.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.132.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.132.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.132.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.133.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.133.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.133.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.133.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.133.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.133.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.134.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.134.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.134.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.134.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.134.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.134.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.135.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.135.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.135.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.135.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + 
"model.layers.43.mlp.experts.135.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.135.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.136.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.136.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.136.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.136.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.136.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.136.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.137.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.137.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.137.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.137.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.137.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.137.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.138.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.138.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.138.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.138.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.138.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.138.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.139.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.139.down_proj.weight_scale": 
"model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.139.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.139.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.139.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.139.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.14.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.14.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.14.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.14.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.14.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.14.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.140.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.140.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.140.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.140.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.140.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.140.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.141.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.141.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.141.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.141.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.141.up_proj.weight": "model-00044-of-00092.safetensors", + 
"model.layers.43.mlp.experts.141.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.142.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.142.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.142.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.142.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.142.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.142.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.143.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.143.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.143.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.143.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.143.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.143.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.144.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.144.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.144.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.144.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.144.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.144.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.145.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.145.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.145.gate_proj.weight": 
"model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.145.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.145.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.145.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.146.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.146.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.146.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.146.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.146.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.146.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.147.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.147.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.147.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.147.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.147.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.147.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.148.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.148.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.148.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.148.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.148.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.148.up_proj.weight_scale": "model-00044-of-00092.safetensors", + 
"model.layers.43.mlp.experts.149.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.149.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.149.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.149.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.149.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.149.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.15.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.15.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.15.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.15.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.15.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.15.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.150.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.150.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.150.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.150.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.150.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.150.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.151.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.151.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.151.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.151.gate_proj.weight_scale": 
"model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.151.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.151.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.152.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.152.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.152.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.152.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.152.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.152.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.153.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.153.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.153.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.153.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.153.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.153.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.154.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.154.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.154.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.154.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.154.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.154.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.155.down_proj.weight": "model-00044-of-00092.safetensors", + 
"model.layers.43.mlp.experts.155.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.155.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.155.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.155.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.155.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.156.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.156.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.156.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.156.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.156.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.156.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.157.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.157.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.157.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.157.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.157.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.157.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.158.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.158.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.158.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.158.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.158.up_proj.weight": 
"model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.158.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.159.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.159.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.159.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.159.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.159.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.159.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.16.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.16.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.16.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.16.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.16.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.16.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.17.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.17.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.17.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.17.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.17.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.17.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.18.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.18.down_proj.weight_scale": "model-00044-of-00092.safetensors", + 
"model.layers.43.mlp.experts.18.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.18.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.18.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.18.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.19.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.19.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.19.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.19.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.19.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.19.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.2.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.2.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.2.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.2.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.2.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.2.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.20.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.20.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.20.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.20.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.20.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.20.up_proj.weight_scale": "model-00044-of-00092.safetensors", 
+ "model.layers.43.mlp.experts.21.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.21.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.21.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.21.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.21.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.21.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.22.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.22.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.22.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.22.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.22.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.22.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.23.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.23.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.23.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.23.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.23.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.23.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.24.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.24.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.24.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.24.gate_proj.weight_scale": 
"model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.24.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.24.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.25.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.25.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.25.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.25.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.25.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.25.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.26.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.26.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.26.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.26.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.26.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.26.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.27.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.27.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.27.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.27.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.27.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.27.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.28.down_proj.weight": "model-00044-of-00092.safetensors", + 
"model.layers.43.mlp.experts.28.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.28.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.28.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.28.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.28.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.29.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.29.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.29.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.29.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.29.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.29.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.3.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.3.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.3.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.3.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.3.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.3.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.30.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.30.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.30.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.30.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.30.up_proj.weight": 
"model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.30.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.31.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.31.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.31.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.31.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.31.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.31.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.32.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.32.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.32.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.32.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.32.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.32.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.33.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.33.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.33.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.33.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.33.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.33.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.34.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.34.down_proj.weight_scale": "model-00044-of-00092.safetensors", + 
"model.layers.43.mlp.experts.34.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.34.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.34.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.34.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.35.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.35.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.35.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.35.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.35.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.35.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.36.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.36.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.36.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.36.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.36.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.36.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.37.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.37.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.37.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.37.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.37.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.37.up_proj.weight_scale": 
"model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.38.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.38.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.38.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.38.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.38.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.38.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.39.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.39.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.39.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.39.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.39.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.39.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.4.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.4.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.4.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.4.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.4.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.4.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.40.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.40.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.40.gate_proj.weight": "model-00044-of-00092.safetensors", + 
"model.layers.43.mlp.experts.40.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.40.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.40.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.41.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.41.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.41.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.41.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.41.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.41.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.42.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.42.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.42.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.42.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.42.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.42.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.43.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.43.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.43.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.43.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.43.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.43.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.44.down_proj.weight": 
"model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.44.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.44.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.44.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.44.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.44.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.45.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.45.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.45.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.45.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.45.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.45.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.46.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.46.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.46.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.46.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.46.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.46.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.47.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.47.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.47.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.47.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + 
"model.layers.43.mlp.experts.47.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.47.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.48.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.48.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.48.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.48.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.48.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.48.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.49.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.49.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.49.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.49.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.49.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.49.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.5.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.5.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.5.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.5.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.5.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.5.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.50.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.50.down_proj.weight_scale": "model-00044-of-00092.safetensors", 
+ "model.layers.43.mlp.experts.50.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.50.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.50.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.50.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.51.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.51.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.51.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.51.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.51.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.51.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.52.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.52.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.52.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.52.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.52.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.52.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.53.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.53.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.53.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.53.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.53.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.53.up_proj.weight_scale": 
"model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.54.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.54.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.54.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.54.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.54.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.54.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.55.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.55.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.55.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.55.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.55.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.55.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.56.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.56.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.56.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.56.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.56.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.56.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.57.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.57.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.57.gate_proj.weight": "model-00044-of-00092.safetensors", + 
"model.layers.43.mlp.experts.57.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.57.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.57.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.58.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.58.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.58.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.58.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.58.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.58.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.59.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.59.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.59.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.59.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.59.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.59.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.6.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.6.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.6.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.6.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.6.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.6.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.60.down_proj.weight": "model-00044-of-00092.safetensors", 
+ "model.layers.43.mlp.experts.60.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.60.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.60.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.60.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.60.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.61.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.61.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.61.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.61.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.61.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.61.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.62.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.62.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.62.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.62.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.62.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.62.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.63.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.63.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.63.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.63.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.63.up_proj.weight": 
"model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.63.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.64.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.64.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.64.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.64.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.64.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.64.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.65.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.65.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.65.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.65.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.65.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.65.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.66.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.66.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.66.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.66.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.66.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.66.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.67.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.67.down_proj.weight_scale": "model-00044-of-00092.safetensors", + 
"model.layers.43.mlp.experts.67.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.67.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.67.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.67.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.68.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.68.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.68.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.68.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.68.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.68.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.69.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.69.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.69.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.69.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.69.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.69.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.7.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.7.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.7.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.7.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.7.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.7.up_proj.weight_scale": "model-00044-of-00092.safetensors", 
+ "model.layers.43.mlp.experts.70.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.70.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.70.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.70.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.70.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.70.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.71.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.71.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.71.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.71.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.71.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.71.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.72.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.72.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.72.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.72.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.72.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.72.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.73.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.73.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.73.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.73.gate_proj.weight_scale": 
"model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.73.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.73.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.74.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.74.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.74.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.74.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.74.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.74.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.75.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.75.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.75.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.75.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.75.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.75.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.76.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.76.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.76.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.76.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.76.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.76.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.77.down_proj.weight": "model-00044-of-00092.safetensors", + 
"model.layers.43.mlp.experts.77.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.77.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.77.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.77.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.77.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.78.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.78.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.78.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.78.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.78.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.78.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.79.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.79.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.79.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.79.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.79.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.79.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.8.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.8.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.8.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.8.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.8.up_proj.weight": 
"model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.8.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.80.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.80.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.80.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.80.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.80.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.80.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.81.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.81.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.81.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.81.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.81.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.81.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.82.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.82.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.82.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.82.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.82.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.82.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.83.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.83.down_proj.weight_scale": "model-00044-of-00092.safetensors", + 
"model.layers.43.mlp.experts.83.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.83.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.83.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.83.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.84.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.84.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.84.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.84.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.84.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.84.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.85.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.85.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.85.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.85.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.85.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.85.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.86.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.86.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.86.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.86.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.86.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.86.up_proj.weight_scale": 
"model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.87.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.87.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.87.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.87.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.87.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.87.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.88.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.88.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.88.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.88.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.88.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.88.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.89.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.89.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.89.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.89.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.89.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.89.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.9.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.9.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.9.gate_proj.weight": "model-00044-of-00092.safetensors", + 
"model.layers.43.mlp.experts.9.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.9.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.9.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.90.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.90.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.90.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.90.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.90.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.90.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.91.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.91.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.91.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.91.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.91.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.91.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.92.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.92.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.92.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.92.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.92.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.92.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.93.down_proj.weight": 
"model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.93.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.93.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.93.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.93.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.93.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.94.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.94.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.94.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.94.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.94.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.94.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.95.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.95.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.95.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.95.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.95.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.95.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.96.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.96.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.96.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.96.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + 
"model.layers.43.mlp.experts.96.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.96.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.97.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.97.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.97.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.97.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.97.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.97.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.98.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.98.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.98.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.98.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.98.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.98.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.99.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.99.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.99.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.99.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.99.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.experts.99.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.gate.e_score_correction_bias": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.gate.weight": "model-00044-of-00092.safetensors", + 
"model.layers.43.mlp.shared_experts.down_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.shared_experts.down_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.shared_experts.gate_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.shared_experts.gate_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.shared_experts.up_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.mlp.shared_experts.up_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.post_attention_layernorm.weight": "model-00044-of-00092.safetensors", + "model.layers.43.self_attn.k_norm.weight": "model-00044-of-00092.safetensors", + "model.layers.43.self_attn.k_proj.bias": "model-00044-of-00092.safetensors", + "model.layers.43.self_attn.k_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.self_attn.k_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.self_attn.o_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.self_attn.o_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.self_attn.q_norm.weight": "model-00044-of-00092.safetensors", + "model.layers.43.self_attn.q_proj.bias": "model-00044-of-00092.safetensors", + "model.layers.43.self_attn.q_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.self_attn.q_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.43.self_attn.v_proj.bias": "model-00044-of-00092.safetensors", + "model.layers.43.self_attn.v_proj.weight": "model-00044-of-00092.safetensors", + "model.layers.43.self_attn.v_proj.weight_scale": "model-00044-of-00092.safetensors", + "model.layers.44.input_layernorm.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.0.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.0.down_proj.weight_scale": "model-00045-of-00092.safetensors", + 
"model.layers.44.mlp.experts.0.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.0.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.0.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.0.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.1.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.1.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.1.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.1.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.1.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.1.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.10.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.10.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.10.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.10.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.10.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.10.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.100.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.100.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.100.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.100.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.100.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.100.up_proj.weight_scale": 
"model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.101.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.101.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.101.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.101.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.101.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.101.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.102.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.102.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.102.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.102.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.102.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.102.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.103.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.103.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.103.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.103.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.103.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.103.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.104.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.104.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.104.gate_proj.weight": "model-00045-of-00092.safetensors", + 
"model.layers.44.mlp.experts.104.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.104.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.104.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.105.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.105.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.105.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.105.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.105.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.105.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.106.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.106.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.106.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.106.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.106.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.106.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.107.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.107.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.107.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.107.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.107.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.107.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.108.down_proj.weight": 
"model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.108.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.108.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.108.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.108.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.108.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.109.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.109.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.109.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.109.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.109.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.109.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.11.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.11.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.11.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.11.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.11.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.11.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.110.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.110.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.110.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.110.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + 
"model.layers.44.mlp.experts.110.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.110.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.111.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.111.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.111.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.111.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.111.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.111.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.112.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.112.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.112.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.112.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.112.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.112.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.113.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.113.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.113.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.113.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.113.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.113.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.114.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.114.down_proj.weight_scale": 
"model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.114.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.114.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.114.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.114.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.115.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.115.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.115.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.115.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.115.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.115.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.116.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.116.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.116.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.116.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.116.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.116.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.117.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.117.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.117.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.117.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.117.up_proj.weight": "model-00045-of-00092.safetensors", + 
"model.layers.44.mlp.experts.117.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.118.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.118.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.118.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.118.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.118.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.118.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.119.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.119.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.119.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.119.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.119.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.119.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.12.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.12.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.12.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.12.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.12.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.12.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.120.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.120.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.120.gate_proj.weight": 
"model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.120.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.120.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.120.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.121.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.121.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.121.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.121.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.121.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.121.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.122.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.122.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.122.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.122.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.122.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.122.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.123.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.123.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.123.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.123.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.123.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.123.up_proj.weight_scale": "model-00045-of-00092.safetensors", + 
"model.layers.44.mlp.experts.124.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.124.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.124.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.124.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.124.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.124.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.125.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.125.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.125.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.125.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.125.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.125.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.126.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.126.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.126.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.126.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.126.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.126.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.127.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.127.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.127.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.127.gate_proj.weight_scale": 
"model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.127.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.127.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.128.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.128.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.128.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.128.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.128.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.128.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.129.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.129.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.129.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.129.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.129.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.129.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.13.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.13.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.13.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.13.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.13.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.13.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.130.down_proj.weight": "model-00045-of-00092.safetensors", + 
"model.layers.44.mlp.experts.130.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.130.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.130.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.130.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.130.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.131.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.131.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.131.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.131.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.131.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.131.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.132.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.132.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.132.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.132.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.132.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.132.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.133.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.133.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.133.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.133.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.133.up_proj.weight": 
"model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.133.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.134.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.134.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.134.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.134.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.134.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.134.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.135.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.135.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.135.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.135.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.135.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.135.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.136.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.136.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.136.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.136.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.136.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.136.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.137.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.137.down_proj.weight_scale": "model-00045-of-00092.safetensors", + 
"model.layers.44.mlp.experts.137.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.137.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.137.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.137.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.138.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.138.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.138.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.138.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.138.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.138.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.139.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.139.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.139.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.139.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.139.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.139.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.14.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.14.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.14.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.14.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.14.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.14.up_proj.weight_scale": 
"model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.140.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.140.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.140.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.140.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.140.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.140.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.141.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.141.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.141.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.141.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.141.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.141.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.142.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.142.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.142.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.142.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.142.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.142.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.143.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.143.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.143.gate_proj.weight": "model-00045-of-00092.safetensors", + 
"model.layers.44.mlp.experts.143.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.143.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.143.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.144.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.144.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.144.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.144.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.144.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.144.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.145.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.145.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.145.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.145.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.145.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.145.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.146.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.146.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.146.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.146.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.146.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.146.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.147.down_proj.weight": 
"model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.147.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.147.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.147.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.147.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.147.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.148.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.148.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.148.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.148.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.148.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.148.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.149.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.149.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.149.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.149.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.149.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.149.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.15.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.15.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.15.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.15.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + 
"model.layers.44.mlp.experts.15.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.15.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.150.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.150.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.150.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.150.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.150.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.150.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.151.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.151.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.151.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.151.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.151.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.151.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.152.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.152.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.152.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.152.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.152.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.152.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.153.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.153.down_proj.weight_scale": 
"model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.153.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.153.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.153.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.153.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.154.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.154.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.154.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.154.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.154.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.154.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.155.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.155.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.155.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.155.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.155.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.155.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.156.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.156.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.156.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.156.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.156.up_proj.weight": "model-00045-of-00092.safetensors", + 
"model.layers.44.mlp.experts.156.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.157.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.157.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.157.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.157.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.157.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.157.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.158.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.158.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.158.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.158.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.158.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.158.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.159.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.159.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.159.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.159.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.159.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.159.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.16.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.16.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.16.gate_proj.weight": 
"model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.16.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.16.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.16.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.17.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.17.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.17.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.17.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.17.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.17.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.18.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.18.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.18.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.18.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.18.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.18.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.19.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.19.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.19.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.19.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.19.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.19.up_proj.weight_scale": "model-00045-of-00092.safetensors", + 
"model.layers.44.mlp.experts.2.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.2.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.2.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.2.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.2.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.2.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.20.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.20.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.20.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.20.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.20.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.20.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.21.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.21.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.21.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.21.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.21.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.21.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.22.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.22.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.22.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.22.gate_proj.weight_scale": 
"model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.22.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.22.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.23.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.23.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.23.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.23.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.23.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.23.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.24.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.24.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.24.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.24.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.24.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.24.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.25.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.25.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.25.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.25.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.25.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.25.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.26.down_proj.weight": "model-00045-of-00092.safetensors", + 
"model.layers.44.mlp.experts.26.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.26.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.26.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.26.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.26.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.27.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.27.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.27.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.27.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.27.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.27.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.28.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.28.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.28.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.28.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.28.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.28.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.29.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.29.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.29.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.29.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.29.up_proj.weight": 
"model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.29.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.3.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.3.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.3.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.3.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.3.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.3.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.30.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.30.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.30.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.30.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.30.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.30.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.31.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.31.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.31.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.31.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.31.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.31.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.32.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.32.down_proj.weight_scale": "model-00045-of-00092.safetensors", + 
"model.layers.44.mlp.experts.32.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.32.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.32.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.32.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.33.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.33.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.33.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.33.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.33.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.33.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.34.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.34.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.34.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.34.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.34.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.34.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.35.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.35.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.35.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.35.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.35.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.35.up_proj.weight_scale": 
"model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.36.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.36.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.36.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.36.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.36.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.36.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.37.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.37.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.37.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.37.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.37.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.37.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.38.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.38.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.38.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.38.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.38.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.38.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.39.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.39.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.39.gate_proj.weight": "model-00045-of-00092.safetensors", + 
"model.layers.44.mlp.experts.39.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.39.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.39.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.4.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.4.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.4.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.4.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.4.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.4.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.40.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.40.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.40.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.40.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.40.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.40.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.41.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.41.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.41.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.41.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.41.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.41.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.42.down_proj.weight": "model-00045-of-00092.safetensors", 
+ "model.layers.44.mlp.experts.42.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.42.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.42.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.42.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.42.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.43.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.43.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.43.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.43.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.43.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.43.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.44.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.44.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.44.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.44.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.44.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.44.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.45.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.45.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.45.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.45.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.45.up_proj.weight": 
"model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.45.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.46.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.46.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.46.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.46.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.46.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.46.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.47.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.47.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.47.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.47.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.47.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.47.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.48.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.48.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.48.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.48.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.48.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.48.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.49.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.49.down_proj.weight_scale": "model-00045-of-00092.safetensors", + 
"model.layers.44.mlp.experts.49.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.49.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.49.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.49.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.5.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.5.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.5.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.5.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.5.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.5.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.50.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.50.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.50.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.50.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.50.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.50.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.51.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.51.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.51.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.51.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.51.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.51.up_proj.weight_scale": "model-00045-of-00092.safetensors", 
+ "model.layers.44.mlp.experts.52.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.52.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.52.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.52.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.52.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.52.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.53.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.53.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.53.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.53.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.53.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.53.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.54.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.54.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.54.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.54.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.54.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.54.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.55.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.55.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.55.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.55.gate_proj.weight_scale": 
"model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.55.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.55.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.56.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.56.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.56.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.56.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.56.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.56.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.57.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.57.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.57.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.57.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.57.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.57.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.58.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.58.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.58.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.58.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.58.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.58.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.59.down_proj.weight": "model-00045-of-00092.safetensors", + 
"model.layers.44.mlp.experts.59.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.59.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.59.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.59.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.59.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.6.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.6.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.6.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.6.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.6.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.6.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.60.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.60.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.60.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.60.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.60.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.60.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.61.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.61.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.61.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.61.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.61.up_proj.weight": 
"model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.61.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.62.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.62.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.62.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.62.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.62.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.62.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.63.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.63.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.63.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.63.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.63.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.63.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.64.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.64.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.64.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.64.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.64.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.64.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.65.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.65.down_proj.weight_scale": "model-00045-of-00092.safetensors", + 
"model.layers.44.mlp.experts.65.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.65.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.65.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.65.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.66.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.66.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.66.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.66.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.66.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.66.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.67.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.67.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.67.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.67.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.67.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.67.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.68.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.68.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.68.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.68.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.68.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.68.up_proj.weight_scale": 
"model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.69.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.69.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.69.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.69.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.69.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.69.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.7.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.7.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.7.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.7.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.7.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.7.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.70.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.70.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.70.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.70.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.70.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.70.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.71.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.71.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.71.gate_proj.weight": "model-00045-of-00092.safetensors", + 
"model.layers.44.mlp.experts.71.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.71.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.71.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.72.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.72.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.72.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.72.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.72.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.72.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.73.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.73.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.73.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.73.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.73.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.73.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.74.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.74.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.74.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.74.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.74.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.74.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.75.down_proj.weight": 
"model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.75.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.75.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.75.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.75.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.75.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.76.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.76.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.76.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.76.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.76.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.76.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.77.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.77.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.77.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.77.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.77.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.77.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.78.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.78.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.78.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.78.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + 
"model.layers.44.mlp.experts.78.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.78.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.79.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.79.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.79.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.79.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.79.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.79.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.8.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.8.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.8.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.8.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.8.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.8.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.80.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.80.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.80.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.80.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.80.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.80.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.81.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.81.down_proj.weight_scale": "model-00045-of-00092.safetensors", 
+ "model.layers.44.mlp.experts.81.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.81.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.81.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.81.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.82.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.82.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.82.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.82.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.82.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.82.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.83.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.83.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.83.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.83.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.83.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.83.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.84.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.84.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.84.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.84.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.84.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.84.up_proj.weight_scale": 
"model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.85.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.85.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.85.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.85.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.85.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.85.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.86.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.86.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.86.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.86.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.86.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.86.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.87.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.87.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.87.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.87.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.87.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.87.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.88.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.88.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.88.gate_proj.weight": "model-00045-of-00092.safetensors", + 
"model.layers.44.mlp.experts.88.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.88.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.88.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.89.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.89.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.89.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.89.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.89.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.89.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.9.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.9.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.9.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.9.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.9.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.9.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.90.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.90.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.90.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.90.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.90.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.90.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.91.down_proj.weight": "model-00045-of-00092.safetensors", 
+ "model.layers.44.mlp.experts.91.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.91.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.91.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.91.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.91.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.92.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.92.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.92.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.92.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.92.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.92.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.93.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.93.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.93.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.93.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.93.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.93.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.94.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.94.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.94.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.94.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.94.up_proj.weight": 
"model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.94.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.95.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.95.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.95.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.95.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.95.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.95.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.96.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.96.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.96.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.96.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.96.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.96.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.97.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.97.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.97.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.97.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.97.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.97.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.98.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.98.down_proj.weight_scale": "model-00045-of-00092.safetensors", + 
"model.layers.44.mlp.experts.98.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.98.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.98.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.98.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.99.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.99.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.99.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.99.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.99.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.experts.99.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.gate.e_score_correction_bias": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.gate.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.shared_experts.down_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.shared_experts.down_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.shared_experts.gate_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.shared_experts.gate_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.shared_experts.up_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.mlp.shared_experts.up_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.post_attention_layernorm.weight": "model-00045-of-00092.safetensors", + "model.layers.44.self_attn.k_norm.weight": "model-00045-of-00092.safetensors", + "model.layers.44.self_attn.k_proj.bias": "model-00045-of-00092.safetensors", + "model.layers.44.self_attn.k_proj.weight": "model-00045-of-00092.safetensors", + 
"model.layers.44.self_attn.k_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.self_attn.o_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.self_attn.o_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.self_attn.q_norm.weight": "model-00045-of-00092.safetensors", + "model.layers.44.self_attn.q_proj.bias": "model-00045-of-00092.safetensors", + "model.layers.44.self_attn.q_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.self_attn.q_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.44.self_attn.v_proj.bias": "model-00045-of-00092.safetensors", + "model.layers.44.self_attn.v_proj.weight": "model-00045-of-00092.safetensors", + "model.layers.44.self_attn.v_proj.weight_scale": "model-00045-of-00092.safetensors", + "model.layers.45.input_layernorm.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.0.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.0.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.0.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.0.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.0.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.0.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.1.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.1.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.1.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.1.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.1.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.1.up_proj.weight_scale": "model-00046-of-00092.safetensors", + 
"model.layers.45.mlp.experts.10.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.10.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.10.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.10.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.10.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.10.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.100.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.100.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.100.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.100.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.100.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.100.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.101.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.101.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.101.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.101.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.101.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.101.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.102.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.102.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.102.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.102.gate_proj.weight_scale": 
"model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.102.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.102.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.103.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.103.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.103.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.103.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.103.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.103.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.104.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.104.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.104.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.104.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.104.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.104.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.105.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.105.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.105.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.105.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.105.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.105.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.106.down_proj.weight": "model-00046-of-00092.safetensors", + 
"model.layers.45.mlp.experts.106.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.106.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.106.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.106.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.106.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.107.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.107.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.107.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.107.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.107.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.107.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.108.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.108.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.108.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.108.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.108.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.108.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.109.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.109.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.109.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.109.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.109.up_proj.weight": 
"model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.109.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.11.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.11.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.11.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.11.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.11.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.11.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.110.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.110.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.110.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.110.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.110.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.110.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.111.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.111.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.111.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.111.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.111.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.111.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.112.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.112.down_proj.weight_scale": "model-00046-of-00092.safetensors", + 
"model.layers.45.mlp.experts.112.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.112.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.112.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.112.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.113.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.113.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.113.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.113.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.113.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.113.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.114.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.114.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.114.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.114.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.114.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.114.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.115.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.115.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.115.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.115.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.115.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.115.up_proj.weight_scale": 
"model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.116.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.116.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.116.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.116.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.116.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.116.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.117.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.117.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.117.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.117.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.117.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.117.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.118.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.118.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.118.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.118.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.118.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.118.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.119.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.119.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.119.gate_proj.weight": "model-00046-of-00092.safetensors", + 
"model.layers.45.mlp.experts.119.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.119.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.119.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.12.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.12.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.12.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.12.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.12.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.12.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.120.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.120.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.120.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.120.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.120.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.120.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.121.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.121.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.121.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.121.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.121.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.121.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.122.down_proj.weight": 
"model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.122.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.122.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.122.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.122.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.122.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.123.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.123.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.123.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.123.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.123.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.123.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.124.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.124.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.124.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.124.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.124.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.124.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.125.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.125.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.125.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.125.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + 
"model.layers.45.mlp.experts.125.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.125.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.126.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.126.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.126.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.126.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.126.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.126.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.127.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.127.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.127.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.127.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.127.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.127.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.128.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.128.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.128.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.128.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.128.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.128.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.129.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.129.down_proj.weight_scale": 
"model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.129.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.129.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.129.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.129.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.13.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.13.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.13.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.13.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.13.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.13.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.130.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.130.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.130.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.130.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.130.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.130.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.131.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.131.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.131.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.131.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.131.up_proj.weight": "model-00046-of-00092.safetensors", + 
"model.layers.45.mlp.experts.131.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.132.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.132.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.132.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.132.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.132.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.132.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.133.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.133.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.133.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.133.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.133.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.133.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.134.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.134.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.134.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.134.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.134.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.134.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.135.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.135.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.135.gate_proj.weight": 
"model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.135.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.135.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.135.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.136.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.136.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.136.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.136.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.136.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.136.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.137.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.137.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.137.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.137.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.137.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.137.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.138.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.138.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.138.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.138.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.138.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.138.up_proj.weight_scale": "model-00046-of-00092.safetensors", + 
"model.layers.45.mlp.experts.139.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.139.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.139.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.139.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.139.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.139.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.14.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.14.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.14.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.14.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.14.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.14.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.140.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.140.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.140.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.140.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.140.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.140.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.141.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.141.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.141.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.141.gate_proj.weight_scale": 
"model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.141.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.141.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.142.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.142.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.142.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.142.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.142.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.142.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.143.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.143.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.143.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.143.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.143.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.143.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.144.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.144.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.144.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.144.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.144.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.144.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.145.down_proj.weight": "model-00046-of-00092.safetensors", + 
"model.layers.45.mlp.experts.145.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.145.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.145.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.145.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.145.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.146.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.146.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.146.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.146.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.146.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.146.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.147.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.147.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.147.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.147.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.147.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.147.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.148.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.148.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.148.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.148.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.148.up_proj.weight": 
"model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.148.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.149.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.149.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.149.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.149.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.149.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.149.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.15.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.15.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.15.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.15.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.15.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.15.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.150.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.150.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.150.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.150.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.150.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.150.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.151.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.151.down_proj.weight_scale": "model-00046-of-00092.safetensors", + 
"model.layers.45.mlp.experts.151.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.151.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.151.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.151.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.152.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.152.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.152.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.152.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.152.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.152.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.153.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.153.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.153.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.153.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.153.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.153.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.154.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.154.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.154.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.154.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.154.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.154.up_proj.weight_scale": 
"model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.155.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.155.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.155.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.155.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.155.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.155.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.156.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.156.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.156.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.156.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.156.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.156.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.157.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.157.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.157.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.157.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.157.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.157.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.158.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.158.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.158.gate_proj.weight": "model-00046-of-00092.safetensors", + 
"model.layers.45.mlp.experts.158.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.158.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.158.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.159.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.159.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.159.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.159.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.159.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.159.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.16.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.16.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.16.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.16.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.16.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.16.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.17.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.17.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.17.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.17.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.17.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.17.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.18.down_proj.weight": 
"model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.18.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.18.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.18.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.18.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.18.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.19.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.19.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.19.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.19.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.19.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.19.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.2.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.2.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.2.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.2.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.2.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.2.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.20.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.20.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.20.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.20.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + 
"model.layers.45.mlp.experts.20.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.20.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.21.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.21.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.21.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.21.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.21.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.21.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.22.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.22.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.22.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.22.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.22.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.22.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.23.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.23.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.23.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.23.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.23.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.23.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.24.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.24.down_proj.weight_scale": 
"model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.24.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.24.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.24.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.24.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.25.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.25.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.25.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.25.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.25.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.25.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.26.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.26.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.26.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.26.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.26.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.26.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.27.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.27.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.27.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.27.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.27.up_proj.weight": "model-00046-of-00092.safetensors", + 
"model.layers.45.mlp.experts.27.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.28.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.28.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.28.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.28.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.28.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.28.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.29.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.29.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.29.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.29.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.29.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.29.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.3.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.3.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.3.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.3.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.3.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.3.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.30.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.30.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.30.gate_proj.weight": 
"model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.30.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.30.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.30.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.31.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.31.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.31.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.31.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.31.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.31.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.32.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.32.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.32.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.32.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.32.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.32.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.33.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.33.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.33.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.33.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.33.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.33.up_proj.weight_scale": "model-00046-of-00092.safetensors", + 
"model.layers.45.mlp.experts.34.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.34.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.34.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.34.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.34.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.34.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.35.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.35.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.35.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.35.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.35.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.35.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.36.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.36.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.36.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.36.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.36.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.36.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.37.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.37.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.37.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.37.gate_proj.weight_scale": 
"model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.37.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.37.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.38.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.38.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.38.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.38.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.38.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.38.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.39.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.39.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.39.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.39.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.39.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.39.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.4.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.4.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.4.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.4.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.4.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.4.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.40.down_proj.weight": "model-00046-of-00092.safetensors", + 
"model.layers.45.mlp.experts.40.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.40.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.40.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.40.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.40.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.41.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.41.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.41.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.41.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.41.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.41.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.42.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.42.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.42.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.42.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.42.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.42.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.43.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.43.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.43.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.43.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.43.up_proj.weight": 
"model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.43.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.44.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.44.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.44.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.44.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.44.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.44.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.45.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.45.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.45.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.45.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.45.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.45.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.46.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.46.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.46.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.46.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.46.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.46.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.47.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.47.down_proj.weight_scale": "model-00046-of-00092.safetensors", + 
"model.layers.45.mlp.experts.47.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.47.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.47.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.47.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.48.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.48.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.48.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.48.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.48.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.48.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.49.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.49.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.49.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.49.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.49.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.49.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.5.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.5.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.5.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.5.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.5.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.5.up_proj.weight_scale": "model-00046-of-00092.safetensors", 
+ "model.layers.45.mlp.experts.50.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.50.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.50.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.50.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.50.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.50.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.51.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.51.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.51.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.51.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.51.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.51.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.52.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.52.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.52.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.52.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.52.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.52.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.53.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.53.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.53.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.53.gate_proj.weight_scale": 
"model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.53.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.53.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.54.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.54.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.54.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.54.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.54.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.54.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.55.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.55.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.55.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.55.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.55.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.55.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.56.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.56.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.56.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.56.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.56.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.56.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.57.down_proj.weight": "model-00046-of-00092.safetensors", + 
"model.layers.45.mlp.experts.57.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.57.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.57.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.57.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.57.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.58.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.58.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.58.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.58.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.58.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.58.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.59.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.59.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.59.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.59.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.59.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.59.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.6.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.6.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.6.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.6.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.6.up_proj.weight": 
"model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.6.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.60.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.60.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.60.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.60.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.60.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.60.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.61.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.61.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.61.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.61.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.61.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.61.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.62.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.62.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.62.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.62.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.62.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.62.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.63.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.63.down_proj.weight_scale": "model-00046-of-00092.safetensors", + 
"model.layers.45.mlp.experts.63.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.63.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.63.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.63.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.64.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.64.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.64.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.64.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.64.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.64.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.65.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.65.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.65.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.65.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.65.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.65.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.66.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.66.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.66.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.66.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.66.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.66.up_proj.weight_scale": 
"model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.67.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.67.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.67.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.67.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.67.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.67.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.68.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.68.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.68.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.68.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.68.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.68.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.69.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.69.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.69.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.69.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.69.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.69.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.7.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.7.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.7.gate_proj.weight": "model-00046-of-00092.safetensors", + 
"model.layers.45.mlp.experts.7.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.7.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.7.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.70.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.70.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.70.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.70.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.70.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.70.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.71.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.71.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.71.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.71.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.71.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.71.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.72.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.72.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.72.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.72.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.72.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.72.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.73.down_proj.weight": 
"model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.73.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.73.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.73.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.73.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.73.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.74.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.74.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.74.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.74.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.74.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.74.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.75.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.75.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.75.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.75.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.75.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.75.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.76.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.76.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.76.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.76.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + 
"model.layers.45.mlp.experts.76.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.76.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.77.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.77.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.77.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.77.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.77.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.77.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.78.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.78.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.78.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.78.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.78.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.78.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.79.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.79.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.79.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.79.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.79.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.79.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.8.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.8.down_proj.weight_scale": 
"model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.8.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.8.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.8.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.8.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.80.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.80.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.80.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.80.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.80.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.80.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.81.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.81.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.81.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.81.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.81.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.81.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.82.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.82.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.82.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.82.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.82.up_proj.weight": "model-00046-of-00092.safetensors", + 
"model.layers.45.mlp.experts.82.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.83.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.83.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.83.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.83.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.83.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.83.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.84.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.84.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.84.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.84.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.84.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.84.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.85.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.85.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.85.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.85.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.85.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.85.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.86.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.86.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.86.gate_proj.weight": 
"model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.86.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.86.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.86.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.87.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.87.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.87.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.87.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.87.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.87.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.88.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.88.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.88.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.88.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.88.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.88.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.89.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.89.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.89.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.89.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.89.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.89.up_proj.weight_scale": "model-00046-of-00092.safetensors", + 
"model.layers.45.mlp.experts.9.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.9.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.9.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.9.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.9.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.9.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.90.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.90.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.90.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.90.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.90.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.90.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.91.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.91.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.91.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.91.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.91.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.91.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.92.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.92.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.92.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.92.gate_proj.weight_scale": 
"model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.92.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.92.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.93.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.93.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.93.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.93.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.93.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.93.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.94.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.94.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.94.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.94.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.94.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.94.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.95.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.95.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.95.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.95.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.95.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.95.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.96.down_proj.weight": "model-00046-of-00092.safetensors", + 
"model.layers.45.mlp.experts.96.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.96.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.96.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.96.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.96.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.97.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.97.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.97.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.97.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.97.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.97.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.98.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.98.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.98.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.98.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.98.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.98.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.99.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.99.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.99.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.99.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.99.up_proj.weight": 
"model-00046-of-00092.safetensors", + "model.layers.45.mlp.experts.99.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.gate.e_score_correction_bias": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.gate.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.shared_experts.down_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.shared_experts.down_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.shared_experts.gate_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.shared_experts.gate_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.shared_experts.up_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.mlp.shared_experts.up_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.post_attention_layernorm.weight": "model-00046-of-00092.safetensors", + "model.layers.45.self_attn.k_norm.weight": "model-00046-of-00092.safetensors", + "model.layers.45.self_attn.k_proj.bias": "model-00046-of-00092.safetensors", + "model.layers.45.self_attn.k_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.self_attn.k_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.self_attn.o_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.self_attn.o_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.self_attn.q_norm.weight": "model-00046-of-00092.safetensors", + "model.layers.45.self_attn.q_proj.bias": "model-00046-of-00092.safetensors", + "model.layers.45.self_attn.q_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.self_attn.q_proj.weight_scale": "model-00046-of-00092.safetensors", + "model.layers.45.self_attn.v_proj.bias": "model-00046-of-00092.safetensors", + "model.layers.45.self_attn.v_proj.weight": "model-00046-of-00092.safetensors", + "model.layers.45.self_attn.v_proj.weight_scale": 
"model-00046-of-00092.safetensors", + "model.layers.46.input_layernorm.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.0.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.0.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.0.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.0.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.0.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.0.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.1.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.1.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.1.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.1.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.1.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.1.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.10.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.10.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.10.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.10.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.10.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.10.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.100.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.100.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.100.gate_proj.weight": 
"model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.100.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.100.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.100.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.101.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.101.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.101.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.101.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.101.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.101.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.102.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.102.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.102.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.102.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.102.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.102.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.103.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.103.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.103.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.103.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.103.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.103.up_proj.weight_scale": "model-00047-of-00092.safetensors", + 
"model.layers.46.mlp.experts.104.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.104.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.104.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.104.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.104.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.104.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.105.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.105.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.105.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.105.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.105.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.105.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.106.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.106.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.106.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.106.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.106.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.106.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.107.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.107.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.107.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.107.gate_proj.weight_scale": 
"model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.107.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.107.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.108.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.108.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.108.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.108.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.108.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.108.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.109.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.109.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.109.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.109.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.109.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.109.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.11.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.11.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.11.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.11.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.11.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.11.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.110.down_proj.weight": "model-00047-of-00092.safetensors", + 
"model.layers.46.mlp.experts.110.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.110.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.110.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.110.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.110.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.111.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.111.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.111.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.111.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.111.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.111.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.112.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.112.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.112.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.112.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.112.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.112.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.113.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.113.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.113.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.113.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.113.up_proj.weight": 
"model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.113.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.114.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.114.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.114.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.114.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.114.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.114.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.115.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.115.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.115.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.115.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.115.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.115.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.116.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.116.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.116.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.116.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.116.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.116.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.117.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.117.down_proj.weight_scale": "model-00047-of-00092.safetensors", + 
"model.layers.46.mlp.experts.117.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.117.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.117.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.117.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.118.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.118.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.118.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.118.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.118.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.118.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.119.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.119.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.119.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.119.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.119.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.119.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.12.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.12.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.12.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.12.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.12.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.12.up_proj.weight_scale": 
"model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.120.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.120.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.120.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.120.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.120.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.120.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.121.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.121.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.121.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.121.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.121.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.121.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.122.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.122.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.122.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.122.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.122.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.122.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.123.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.123.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.123.gate_proj.weight": "model-00047-of-00092.safetensors", + 
"model.layers.46.mlp.experts.123.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.123.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.123.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.124.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.124.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.124.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.124.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.124.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.124.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.125.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.125.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.125.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.125.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.125.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.125.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.126.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.126.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.126.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.126.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.126.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.126.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.127.down_proj.weight": 
"model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.127.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.127.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.127.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.127.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.127.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.128.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.128.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.128.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.128.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.128.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.128.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.129.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.129.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.129.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.129.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.129.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.129.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.13.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.13.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.13.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.13.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + 
"model.layers.46.mlp.experts.13.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.13.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.130.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.130.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.130.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.130.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.130.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.130.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.131.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.131.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.131.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.131.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.131.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.131.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.132.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.132.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.132.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.132.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.132.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.132.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.133.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.133.down_proj.weight_scale": 
"model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.133.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.133.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.133.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.133.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.134.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.134.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.134.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.134.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.134.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.134.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.135.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.135.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.135.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.135.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.135.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.135.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.136.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.136.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.136.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.136.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.136.up_proj.weight": "model-00047-of-00092.safetensors", + 
"model.layers.46.mlp.experts.136.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.137.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.137.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.137.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.137.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.137.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.137.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.138.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.138.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.138.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.138.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.138.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.138.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.139.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.139.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.139.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.139.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.139.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.139.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.14.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.14.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.14.gate_proj.weight": 
"model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.14.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.14.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.14.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.140.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.140.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.140.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.140.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.140.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.140.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.141.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.141.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.141.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.141.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.141.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.141.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.142.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.142.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.142.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.142.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.142.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.142.up_proj.weight_scale": "model-00047-of-00092.safetensors", + 
"model.layers.46.mlp.experts.143.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.143.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.143.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.143.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.143.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.143.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.144.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.144.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.144.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.144.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.144.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.144.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.145.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.145.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.145.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.145.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.145.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.145.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.146.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.146.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.146.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.146.gate_proj.weight_scale": 
"model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.146.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.146.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.147.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.147.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.147.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.147.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.147.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.147.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.148.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.148.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.148.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.148.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.148.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.148.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.149.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.149.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.149.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.149.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.149.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.149.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.15.down_proj.weight": "model-00047-of-00092.safetensors", + 
"model.layers.46.mlp.experts.15.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.15.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.15.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.15.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.15.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.150.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.150.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.150.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.150.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.150.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.150.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.151.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.151.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.151.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.151.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.151.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.151.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.152.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.152.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.152.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.152.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.152.up_proj.weight": 
"model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.152.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.153.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.153.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.153.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.153.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.153.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.153.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.154.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.154.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.154.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.154.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.154.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.154.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.155.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.155.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.155.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.155.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.155.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.155.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.156.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.156.down_proj.weight_scale": "model-00047-of-00092.safetensors", + 
"model.layers.46.mlp.experts.156.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.156.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.156.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.156.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.157.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.157.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.157.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.157.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.157.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.157.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.158.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.158.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.158.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.158.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.158.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.158.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.159.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.159.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.159.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.159.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.159.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.159.up_proj.weight_scale": 
"model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.16.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.16.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.16.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.16.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.16.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.16.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.17.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.17.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.17.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.17.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.17.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.17.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.18.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.18.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.18.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.18.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.18.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.18.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.19.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.19.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.19.gate_proj.weight": "model-00047-of-00092.safetensors", + 
"model.layers.46.mlp.experts.19.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.19.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.19.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.2.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.2.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.2.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.2.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.2.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.2.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.20.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.20.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.20.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.20.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.20.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.20.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.21.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.21.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.21.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.21.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.21.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.21.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.22.down_proj.weight": "model-00047-of-00092.safetensors", 
+ "model.layers.46.mlp.experts.22.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.22.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.22.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.22.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.22.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.23.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.23.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.23.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.23.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.23.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.23.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.24.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.24.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.24.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.24.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.24.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.24.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.25.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.25.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.25.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.25.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.25.up_proj.weight": 
"model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.25.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.26.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.26.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.26.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.26.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.26.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.26.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.27.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.27.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.27.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.27.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.27.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.27.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.28.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.28.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.28.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.28.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.28.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.28.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.29.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.29.down_proj.weight_scale": "model-00047-of-00092.safetensors", + 
"model.layers.46.mlp.experts.29.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.29.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.29.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.29.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.3.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.3.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.3.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.3.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.3.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.3.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.30.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.30.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.30.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.30.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.30.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.30.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.31.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.31.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.31.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.31.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.31.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.31.up_proj.weight_scale": "model-00047-of-00092.safetensors", 
+ "model.layers.46.mlp.experts.32.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.32.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.32.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.32.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.32.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.32.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.33.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.33.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.33.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.33.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.33.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.33.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.34.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.34.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.34.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.34.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.34.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.34.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.35.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.35.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.35.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.35.gate_proj.weight_scale": 
"model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.35.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.35.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.36.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.36.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.36.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.36.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.36.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.36.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.37.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.37.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.37.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.37.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.37.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.37.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.38.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.38.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.38.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.38.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.38.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.38.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.39.down_proj.weight": "model-00047-of-00092.safetensors", + 
"model.layers.46.mlp.experts.39.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.39.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.39.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.39.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.39.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.4.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.4.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.4.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.4.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.4.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.4.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.40.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.40.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.40.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.40.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.40.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.40.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.41.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.41.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.41.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.41.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.41.up_proj.weight": 
"model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.41.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.42.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.42.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.42.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.42.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.42.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.42.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.43.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.43.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.43.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.43.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.43.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.43.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.44.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.44.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.44.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.44.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.44.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.44.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.45.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.45.down_proj.weight_scale": "model-00047-of-00092.safetensors", + 
"model.layers.46.mlp.experts.45.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.45.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.45.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.45.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.46.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.46.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.46.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.46.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.46.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.46.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.47.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.47.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.47.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.47.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.47.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.47.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.48.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.48.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.48.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.48.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.48.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.48.up_proj.weight_scale": 
"model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.49.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.49.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.49.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.49.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.49.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.49.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.5.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.5.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.5.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.5.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.5.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.5.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.50.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.50.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.50.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.50.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.50.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.50.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.51.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.51.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.51.gate_proj.weight": "model-00047-of-00092.safetensors", + 
"model.layers.46.mlp.experts.51.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.51.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.51.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.52.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.52.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.52.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.52.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.52.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.52.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.53.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.53.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.53.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.53.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.53.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.53.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.54.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.54.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.54.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.54.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.54.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.54.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.55.down_proj.weight": 
"model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.55.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.55.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.55.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.55.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.55.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.56.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.56.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.56.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.56.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.56.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.56.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.57.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.57.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.57.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.57.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.57.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.57.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.58.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.58.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.58.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.58.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + 
"model.layers.46.mlp.experts.58.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.58.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.59.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.59.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.59.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.59.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.59.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.59.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.6.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.6.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.6.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.6.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.6.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.6.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.60.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.60.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.60.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.60.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.60.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.60.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.61.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.61.down_proj.weight_scale": "model-00047-of-00092.safetensors", 
+ "model.layers.46.mlp.experts.61.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.61.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.61.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.61.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.62.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.62.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.62.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.62.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.62.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.62.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.63.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.63.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.63.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.63.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.63.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.63.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.64.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.64.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.64.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.64.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.64.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.64.up_proj.weight_scale": 
"model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.65.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.65.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.65.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.65.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.65.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.65.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.66.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.66.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.66.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.66.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.66.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.66.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.67.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.67.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.67.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.67.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.67.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.67.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.68.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.68.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.68.gate_proj.weight": "model-00047-of-00092.safetensors", + 
"model.layers.46.mlp.experts.68.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.68.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.68.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.69.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.69.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.69.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.69.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.69.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.69.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.7.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.7.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.7.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.7.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.7.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.7.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.70.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.70.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.70.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.70.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.70.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.70.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.71.down_proj.weight": "model-00047-of-00092.safetensors", 
+ "model.layers.46.mlp.experts.71.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.71.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.71.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.71.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.71.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.72.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.72.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.72.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.72.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.72.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.72.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.73.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.73.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.73.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.73.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.73.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.73.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.74.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.74.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.74.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.74.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.74.up_proj.weight": 
"model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.74.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.75.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.75.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.75.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.75.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.75.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.75.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.76.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.76.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.76.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.76.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.76.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.76.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.77.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.77.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.77.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.77.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.77.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.77.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.78.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.78.down_proj.weight_scale": "model-00047-of-00092.safetensors", + 
"model.layers.46.mlp.experts.78.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.78.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.78.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.78.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.79.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.79.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.79.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.79.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.79.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.79.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.8.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.8.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.8.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.8.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.8.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.8.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.80.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.80.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.80.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.80.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.80.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.80.up_proj.weight_scale": "model-00047-of-00092.safetensors", 
+ "model.layers.46.mlp.experts.81.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.81.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.81.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.81.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.81.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.81.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.82.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.82.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.82.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.82.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.82.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.82.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.83.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.83.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.83.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.83.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.83.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.83.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.84.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.84.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.84.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.84.gate_proj.weight_scale": 
"model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.84.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.84.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.85.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.85.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.85.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.85.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.85.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.85.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.86.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.86.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.86.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.86.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.86.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.86.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.87.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.87.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.87.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.87.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.87.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.87.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.88.down_proj.weight": "model-00047-of-00092.safetensors", + 
"model.layers.46.mlp.experts.88.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.88.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.88.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.88.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.88.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.89.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.89.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.89.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.89.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.89.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.89.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.9.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.9.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.9.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.9.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.9.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.9.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.90.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.90.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.90.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.90.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.90.up_proj.weight": 
"model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.90.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.91.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.91.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.91.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.91.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.91.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.91.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.92.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.92.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.92.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.92.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.92.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.92.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.93.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.93.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.93.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.93.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.93.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.93.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.94.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.94.down_proj.weight_scale": "model-00047-of-00092.safetensors", + 
"model.layers.46.mlp.experts.94.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.94.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.94.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.94.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.95.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.95.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.95.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.95.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.95.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.95.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.96.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.96.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.96.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.96.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.96.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.96.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.97.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.97.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.97.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.97.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.97.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.97.up_proj.weight_scale": 
"model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.98.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.98.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.98.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.98.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.98.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.98.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.99.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.99.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.99.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.99.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.99.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.experts.99.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.gate.e_score_correction_bias": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.gate.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.shared_experts.down_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.shared_experts.down_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.shared_experts.gate_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.shared_experts.gate_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.shared_experts.up_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.mlp.shared_experts.up_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.post_attention_layernorm.weight": "model-00047-of-00092.safetensors", + 
"model.layers.46.self_attn.k_norm.weight": "model-00047-of-00092.safetensors", + "model.layers.46.self_attn.k_proj.bias": "model-00047-of-00092.safetensors", + "model.layers.46.self_attn.k_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.self_attn.k_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.self_attn.o_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.self_attn.o_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.self_attn.q_norm.weight": "model-00047-of-00092.safetensors", + "model.layers.46.self_attn.q_proj.bias": "model-00047-of-00092.safetensors", + "model.layers.46.self_attn.q_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.self_attn.q_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.46.self_attn.v_proj.bias": "model-00047-of-00092.safetensors", + "model.layers.46.self_attn.v_proj.weight": "model-00047-of-00092.safetensors", + "model.layers.46.self_attn.v_proj.weight_scale": "model-00047-of-00092.safetensors", + "model.layers.47.input_layernorm.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.0.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.0.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.0.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.0.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.0.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.0.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.1.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.1.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.1.gate_proj.weight": "model-00048-of-00092.safetensors", + 
"model.layers.47.mlp.experts.1.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.1.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.1.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.10.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.10.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.10.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.10.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.10.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.10.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.100.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.100.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.100.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.100.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.100.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.100.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.101.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.101.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.101.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.101.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.101.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.101.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.102.down_proj.weight": 
"model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.102.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.102.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.102.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.102.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.102.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.103.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.103.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.103.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.103.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.103.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.103.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.104.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.104.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.104.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.104.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.104.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.104.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.105.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.105.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.105.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.105.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + 
"model.layers.47.mlp.experts.105.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.105.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.106.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.106.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.106.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.106.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.106.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.106.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.107.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.107.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.107.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.107.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.107.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.107.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.108.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.108.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.108.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.108.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.108.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.108.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.109.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.109.down_proj.weight_scale": 
"model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.109.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.109.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.109.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.109.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.11.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.11.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.11.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.11.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.11.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.11.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.110.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.110.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.110.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.110.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.110.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.110.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.111.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.111.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.111.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.111.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.111.up_proj.weight": "model-00048-of-00092.safetensors", + 
"model.layers.47.mlp.experts.111.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.112.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.112.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.112.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.112.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.112.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.112.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.113.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.113.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.113.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.113.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.113.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.113.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.114.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.114.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.114.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.114.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.114.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.114.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.115.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.115.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.115.gate_proj.weight": 
"model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.115.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.115.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.115.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.116.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.116.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.116.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.116.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.116.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.116.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.117.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.117.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.117.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.117.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.117.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.117.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.118.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.118.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.118.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.118.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.118.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.118.up_proj.weight_scale": "model-00048-of-00092.safetensors", + 
"model.layers.47.mlp.experts.119.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.119.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.119.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.119.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.119.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.119.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.12.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.12.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.12.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.12.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.12.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.12.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.120.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.120.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.120.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.120.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.120.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.120.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.121.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.121.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.121.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.121.gate_proj.weight_scale": 
"model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.121.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.121.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.122.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.122.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.122.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.122.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.122.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.122.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.123.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.123.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.123.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.123.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.123.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.123.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.124.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.124.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.124.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.124.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.124.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.124.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.125.down_proj.weight": "model-00048-of-00092.safetensors", + 
"model.layers.47.mlp.experts.125.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.125.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.125.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.125.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.125.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.126.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.126.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.126.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.126.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.126.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.126.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.127.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.127.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.127.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.127.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.127.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.127.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.128.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.128.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.128.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.128.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.128.up_proj.weight": 
"model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.128.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.129.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.129.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.129.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.129.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.129.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.129.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.13.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.13.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.13.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.13.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.13.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.13.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.130.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.130.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.130.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.130.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.130.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.130.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.131.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.131.down_proj.weight_scale": "model-00048-of-00092.safetensors", + 
"model.layers.47.mlp.experts.131.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.131.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.131.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.131.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.132.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.132.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.132.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.132.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.132.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.132.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.133.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.133.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.133.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.133.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.133.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.133.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.134.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.134.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.134.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.134.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.134.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.134.up_proj.weight_scale": 
"model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.135.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.135.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.135.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.135.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.135.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.135.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.136.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.136.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.136.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.136.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.136.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.136.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.137.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.137.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.137.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.137.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.137.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.137.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.138.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.138.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.138.gate_proj.weight": "model-00048-of-00092.safetensors", + 
"model.layers.47.mlp.experts.138.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.138.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.138.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.139.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.139.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.139.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.139.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.139.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.139.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.14.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.14.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.14.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.14.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.14.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.14.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.140.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.140.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.140.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.140.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.140.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.140.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.141.down_proj.weight": 
"model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.141.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.141.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.141.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.141.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.141.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.142.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.142.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.142.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.142.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.142.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.142.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.143.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.143.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.143.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.143.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.143.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.143.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.144.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.144.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.144.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.144.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + 
"model.layers.47.mlp.experts.144.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.144.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.145.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.145.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.145.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.145.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.145.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.145.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.146.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.146.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.146.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.146.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.146.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.146.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.147.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.147.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.147.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.147.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.147.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.147.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.148.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.148.down_proj.weight_scale": 
"model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.148.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.148.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.148.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.148.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.149.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.149.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.149.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.149.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.149.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.149.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.15.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.15.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.15.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.15.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.15.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.15.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.150.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.150.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.150.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.150.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.150.up_proj.weight": "model-00048-of-00092.safetensors", + 
"model.layers.47.mlp.experts.150.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.151.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.151.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.151.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.151.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.151.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.151.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.152.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.152.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.152.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.152.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.152.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.152.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.153.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.153.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.153.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.153.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.153.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.153.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.154.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.154.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.154.gate_proj.weight": 
"model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.154.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.154.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.154.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.155.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.155.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.155.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.155.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.155.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.155.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.156.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.156.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.156.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.156.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.156.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.156.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.157.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.157.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.157.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.157.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.157.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.157.up_proj.weight_scale": "model-00048-of-00092.safetensors", + 
"model.layers.47.mlp.experts.158.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.158.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.158.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.158.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.158.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.158.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.159.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.159.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.159.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.159.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.159.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.159.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.16.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.16.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.16.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.16.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.16.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.16.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.17.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.17.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.17.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.17.gate_proj.weight_scale": 
"model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.17.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.17.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.18.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.18.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.18.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.18.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.18.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.18.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.19.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.19.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.19.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.19.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.19.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.19.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.2.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.2.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.2.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.2.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.2.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.2.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.20.down_proj.weight": "model-00048-of-00092.safetensors", + 
"model.layers.47.mlp.experts.20.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.20.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.20.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.20.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.20.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.21.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.21.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.21.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.21.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.21.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.21.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.22.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.22.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.22.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.22.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.22.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.22.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.23.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.23.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.23.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.23.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.23.up_proj.weight": 
"model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.23.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.24.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.24.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.24.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.24.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.24.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.24.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.25.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.25.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.25.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.25.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.25.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.25.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.26.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.26.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.26.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.26.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.26.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.26.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.27.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.27.down_proj.weight_scale": "model-00048-of-00092.safetensors", + 
"model.layers.47.mlp.experts.27.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.27.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.27.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.27.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.28.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.28.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.28.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.28.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.28.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.28.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.29.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.29.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.29.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.29.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.29.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.29.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.3.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.3.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.3.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.3.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.3.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.3.up_proj.weight_scale": "model-00048-of-00092.safetensors", 
+ "model.layers.47.mlp.experts.30.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.30.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.30.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.30.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.30.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.30.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.31.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.31.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.31.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.31.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.31.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.31.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.32.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.32.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.32.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.32.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.32.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.32.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.33.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.33.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.33.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.33.gate_proj.weight_scale": 
"model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.33.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.33.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.34.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.34.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.34.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.34.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.34.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.34.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.35.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.35.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.35.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.35.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.35.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.35.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.36.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.36.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.36.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.36.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.36.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.36.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.37.down_proj.weight": "model-00048-of-00092.safetensors", + 
"model.layers.47.mlp.experts.37.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.37.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.37.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.37.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.37.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.38.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.38.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.38.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.38.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.38.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.38.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.39.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.39.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.39.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.39.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.39.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.39.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.4.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.4.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.4.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.4.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.4.up_proj.weight": 
"model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.4.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.40.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.40.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.40.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.40.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.40.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.40.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.41.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.41.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.41.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.41.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.41.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.41.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.42.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.42.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.42.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.42.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.42.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.42.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.43.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.43.down_proj.weight_scale": "model-00048-of-00092.safetensors", + 
"model.layers.47.mlp.experts.43.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.43.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.43.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.43.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.44.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.44.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.44.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.44.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.44.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.44.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.45.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.45.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.45.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.45.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.45.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.45.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.46.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.46.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.46.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.46.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.46.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.46.up_proj.weight_scale": 
"model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.47.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.47.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.47.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.47.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.47.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.47.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.48.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.48.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.48.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.48.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.48.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.48.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.49.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.49.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.49.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.49.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.49.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.49.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.5.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.5.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.5.gate_proj.weight": "model-00048-of-00092.safetensors", + 
"model.layers.47.mlp.experts.5.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.5.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.5.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.50.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.50.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.50.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.50.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.50.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.50.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.51.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.51.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.51.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.51.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.51.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.51.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.52.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.52.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.52.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.52.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.52.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.52.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.53.down_proj.weight": 
"model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.53.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.53.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.53.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.53.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.53.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.54.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.54.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.54.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.54.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.54.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.54.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.55.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.55.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.55.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.55.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.55.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.55.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.56.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.56.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.56.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.56.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + 
"model.layers.47.mlp.experts.56.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.56.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.57.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.57.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.57.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.57.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.57.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.57.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.58.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.58.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.58.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.58.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.58.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.58.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.59.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.59.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.59.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.59.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.59.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.59.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.6.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.6.down_proj.weight_scale": 
"model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.6.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.6.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.6.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.6.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.60.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.60.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.60.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.60.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.60.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.60.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.61.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.61.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.61.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.61.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.61.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.61.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.62.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.62.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.62.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.62.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.62.up_proj.weight": "model-00048-of-00092.safetensors", + 
"model.layers.47.mlp.experts.62.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.63.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.63.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.63.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.63.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.63.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.63.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.64.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.64.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.64.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.64.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.64.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.64.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.65.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.65.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.65.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.65.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.65.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.65.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.66.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.66.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.66.gate_proj.weight": 
"model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.66.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.66.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.66.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.67.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.67.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.67.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.67.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.67.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.67.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.68.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.68.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.68.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.68.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.68.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.68.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.69.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.69.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.69.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.69.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.69.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.69.up_proj.weight_scale": "model-00048-of-00092.safetensors", + 
"model.layers.47.mlp.experts.7.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.7.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.7.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.7.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.7.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.7.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.70.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.70.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.70.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.70.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.70.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.70.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.71.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.71.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.71.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.71.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.71.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.71.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.72.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.72.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.72.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.72.gate_proj.weight_scale": 
"model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.72.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.72.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.73.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.73.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.73.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.73.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.73.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.73.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.74.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.74.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.74.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.74.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.74.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.74.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.75.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.75.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.75.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.75.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.75.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.75.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.76.down_proj.weight": "model-00048-of-00092.safetensors", + 
"model.layers.47.mlp.experts.76.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.76.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.76.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.76.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.76.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.77.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.77.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.77.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.77.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.77.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.77.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.78.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.78.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.78.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.78.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.78.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.78.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.79.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.79.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.79.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.79.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.79.up_proj.weight": 
"model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.79.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.8.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.8.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.8.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.8.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.8.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.8.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.80.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.80.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.80.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.80.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.80.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.80.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.81.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.81.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.81.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.81.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.81.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.81.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.82.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.82.down_proj.weight_scale": "model-00048-of-00092.safetensors", + 
"model.layers.47.mlp.experts.82.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.82.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.82.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.82.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.83.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.83.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.83.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.83.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.83.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.83.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.84.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.84.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.84.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.84.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.84.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.84.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.85.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.85.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.85.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.85.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.85.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.85.up_proj.weight_scale": 
"model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.86.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.86.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.86.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.86.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.86.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.86.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.87.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.87.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.87.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.87.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.87.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.87.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.88.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.88.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.88.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.88.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.88.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.88.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.89.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.89.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.89.gate_proj.weight": "model-00048-of-00092.safetensors", + 
"model.layers.47.mlp.experts.89.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.89.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.89.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.9.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.9.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.9.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.9.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.9.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.9.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.90.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.90.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.90.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.90.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.90.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.90.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.91.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.91.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.91.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.91.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.91.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.91.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.92.down_proj.weight": "model-00048-of-00092.safetensors", 
+ "model.layers.47.mlp.experts.92.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.92.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.92.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.92.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.92.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.93.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.93.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.93.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.93.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.93.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.93.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.94.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.94.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.94.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.94.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.94.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.94.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.95.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.95.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.95.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.95.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.95.up_proj.weight": 
"model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.95.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.96.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.96.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.96.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.96.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.96.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.96.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.97.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.97.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.97.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.97.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.97.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.97.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.98.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.98.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.98.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.98.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.98.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.98.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.99.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.99.down_proj.weight_scale": "model-00048-of-00092.safetensors", + 
"model.layers.47.mlp.experts.99.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.99.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.99.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.experts.99.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.gate.e_score_correction_bias": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.gate.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.shared_experts.down_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.shared_experts.down_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.shared_experts.gate_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.shared_experts.gate_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.shared_experts.up_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.mlp.shared_experts.up_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.post_attention_layernorm.weight": "model-00048-of-00092.safetensors", + "model.layers.47.self_attn.k_norm.weight": "model-00048-of-00092.safetensors", + "model.layers.47.self_attn.k_proj.bias": "model-00048-of-00092.safetensors", + "model.layers.47.self_attn.k_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.self_attn.k_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.self_attn.o_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.self_attn.o_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.47.self_attn.q_norm.weight": "model-00048-of-00092.safetensors", + "model.layers.47.self_attn.q_proj.bias": "model-00048-of-00092.safetensors", + "model.layers.47.self_attn.q_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.self_attn.q_proj.weight_scale": 
"model-00048-of-00092.safetensors", + "model.layers.47.self_attn.v_proj.bias": "model-00048-of-00092.safetensors", + "model.layers.47.self_attn.v_proj.weight": "model-00048-of-00092.safetensors", + "model.layers.47.self_attn.v_proj.weight_scale": "model-00048-of-00092.safetensors", + "model.layers.48.input_layernorm.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.0.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.0.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.0.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.0.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.0.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.0.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.1.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.1.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.1.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.1.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.1.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.1.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.10.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.10.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.10.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.10.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.10.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.10.up_proj.weight_scale": "model-00049-of-00092.safetensors", + 
"model.layers.48.mlp.experts.100.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.100.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.100.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.100.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.100.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.100.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.101.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.101.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.101.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.101.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.101.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.101.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.102.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.102.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.102.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.102.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.102.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.102.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.103.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.103.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.103.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.103.gate_proj.weight_scale": 
"model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.103.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.103.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.104.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.104.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.104.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.104.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.104.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.104.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.105.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.105.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.105.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.105.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.105.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.105.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.106.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.106.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.106.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.106.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.106.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.106.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.107.down_proj.weight": "model-00049-of-00092.safetensors", + 
"model.layers.48.mlp.experts.107.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.107.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.107.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.107.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.107.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.108.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.108.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.108.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.108.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.108.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.108.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.109.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.109.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.109.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.109.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.109.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.109.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.11.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.11.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.11.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.11.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.11.up_proj.weight": 
"model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.11.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.110.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.110.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.110.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.110.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.110.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.110.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.111.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.111.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.111.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.111.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.111.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.111.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.112.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.112.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.112.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.112.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.112.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.112.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.113.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.113.down_proj.weight_scale": "model-00049-of-00092.safetensors", + 
"model.layers.48.mlp.experts.113.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.113.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.113.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.113.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.114.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.114.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.114.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.114.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.114.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.114.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.115.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.115.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.115.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.115.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.115.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.115.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.116.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.116.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.116.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.116.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.116.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.116.up_proj.weight_scale": 
"model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.117.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.117.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.117.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.117.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.117.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.117.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.118.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.118.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.118.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.118.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.118.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.118.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.119.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.119.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.119.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.119.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.119.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.119.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.12.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.12.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.12.gate_proj.weight": "model-00049-of-00092.safetensors", + 
"model.layers.48.mlp.experts.12.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.12.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.12.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.120.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.120.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.120.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.120.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.120.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.120.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.121.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.121.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.121.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.121.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.121.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.121.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.122.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.122.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.122.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.122.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.122.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.122.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.123.down_proj.weight": 
"model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.123.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.123.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.123.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.123.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.123.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.124.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.124.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.124.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.124.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.124.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.124.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.125.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.125.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.125.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.125.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.125.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.125.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.126.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.126.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.126.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.126.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + 
"model.layers.48.mlp.experts.126.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.126.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.127.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.127.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.127.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.127.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.127.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.127.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.128.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.128.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.128.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.128.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.128.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.128.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.129.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.129.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.129.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.129.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.129.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.129.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.13.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.13.down_proj.weight_scale": 
"model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.13.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.13.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.13.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.13.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.130.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.130.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.130.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.130.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.130.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.130.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.131.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.131.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.131.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.131.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.131.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.131.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.132.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.132.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.132.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.132.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.132.up_proj.weight": "model-00049-of-00092.safetensors", + 
"model.layers.48.mlp.experts.132.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.133.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.133.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.133.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.133.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.133.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.133.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.134.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.134.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.134.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.134.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.134.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.134.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.135.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.135.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.135.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.135.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.135.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.135.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.136.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.136.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.136.gate_proj.weight": 
"model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.136.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.136.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.136.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.137.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.137.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.137.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.137.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.137.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.137.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.138.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.138.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.138.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.138.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.138.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.138.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.139.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.139.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.139.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.139.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.139.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.139.up_proj.weight_scale": "model-00049-of-00092.safetensors", + 
"model.layers.48.mlp.experts.14.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.14.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.14.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.14.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.14.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.14.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.140.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.140.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.140.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.140.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.140.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.140.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.141.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.141.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.141.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.141.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.141.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.141.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.142.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.142.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.142.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.142.gate_proj.weight_scale": 
"model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.142.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.142.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.143.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.143.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.143.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.143.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.143.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.143.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.144.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.144.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.144.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.144.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.144.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.144.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.145.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.145.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.145.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.145.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.145.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.145.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.146.down_proj.weight": "model-00049-of-00092.safetensors", + 
"model.layers.48.mlp.experts.146.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.146.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.146.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.146.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.146.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.147.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.147.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.147.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.147.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.147.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.147.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.148.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.148.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.148.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.148.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.148.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.148.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.149.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.149.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.149.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.149.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.149.up_proj.weight": 
"model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.149.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.15.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.15.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.15.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.15.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.15.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.15.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.150.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.150.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.150.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.150.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.150.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.150.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.151.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.151.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.151.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.151.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.151.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.151.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.152.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.152.down_proj.weight_scale": "model-00049-of-00092.safetensors", + 
"model.layers.48.mlp.experts.152.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.152.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.152.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.152.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.153.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.153.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.153.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.153.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.153.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.153.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.154.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.154.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.154.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.154.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.154.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.154.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.155.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.155.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.155.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.155.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.155.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.155.up_proj.weight_scale": 
"model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.156.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.156.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.156.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.156.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.156.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.156.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.157.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.157.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.157.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.157.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.157.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.157.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.158.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.158.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.158.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.158.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.158.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.158.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.159.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.159.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.159.gate_proj.weight": "model-00049-of-00092.safetensors", + 
"model.layers.48.mlp.experts.159.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.159.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.159.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.16.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.16.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.16.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.16.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.16.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.16.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.17.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.17.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.17.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.17.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.17.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.17.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.18.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.18.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.18.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.18.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.18.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.18.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.19.down_proj.weight": 
"model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.19.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.19.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.19.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.19.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.19.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.2.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.2.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.2.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.2.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.2.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.2.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.20.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.20.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.20.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.20.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.20.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.20.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.21.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.21.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.21.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.21.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + 
"model.layers.48.mlp.experts.21.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.21.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.22.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.22.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.22.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.22.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.22.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.22.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.23.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.23.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.23.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.23.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.23.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.23.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.24.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.24.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.24.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.24.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.24.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.24.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.25.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.25.down_proj.weight_scale": 
"model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.25.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.25.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.25.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.25.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.26.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.26.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.26.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.26.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.26.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.26.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.27.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.27.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.27.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.27.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.27.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.27.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.28.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.28.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.28.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.28.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.28.up_proj.weight": "model-00049-of-00092.safetensors", + 
"model.layers.48.mlp.experts.28.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.29.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.29.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.29.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.29.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.29.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.29.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.3.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.3.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.3.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.3.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.3.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.3.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.30.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.30.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.30.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.30.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.30.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.30.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.31.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.31.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.31.gate_proj.weight": 
"model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.31.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.31.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.31.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.32.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.32.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.32.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.32.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.32.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.32.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.33.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.33.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.33.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.33.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.33.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.33.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.34.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.34.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.34.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.34.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.34.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.34.up_proj.weight_scale": "model-00049-of-00092.safetensors", + 
"model.layers.48.mlp.experts.35.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.35.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.35.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.35.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.35.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.35.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.36.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.36.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.36.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.36.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.36.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.36.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.37.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.37.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.37.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.37.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.37.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.37.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.38.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.38.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.38.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.38.gate_proj.weight_scale": 
"model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.38.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.38.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.39.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.39.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.39.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.39.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.39.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.39.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.4.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.4.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.4.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.4.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.4.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.4.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.40.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.40.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.40.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.40.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.40.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.40.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.41.down_proj.weight": "model-00049-of-00092.safetensors", + 
"model.layers.48.mlp.experts.41.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.41.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.41.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.41.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.41.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.42.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.42.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.42.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.42.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.42.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.42.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.43.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.43.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.43.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.43.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.43.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.43.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.44.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.44.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.44.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.44.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.44.up_proj.weight": 
"model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.44.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.45.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.45.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.45.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.45.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.45.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.45.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.46.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.46.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.46.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.46.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.46.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.46.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.47.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.47.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.47.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.47.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.47.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.47.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.48.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.48.down_proj.weight_scale": "model-00049-of-00092.safetensors", + 
"model.layers.48.mlp.experts.48.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.48.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.48.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.48.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.49.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.49.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.49.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.49.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.49.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.49.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.5.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.5.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.5.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.5.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.5.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.5.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.50.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.50.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.50.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.50.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.50.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.50.up_proj.weight_scale": "model-00049-of-00092.safetensors", 
+ "model.layers.48.mlp.experts.51.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.51.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.51.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.51.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.51.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.51.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.52.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.52.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.52.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.52.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.52.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.52.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.53.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.53.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.53.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.53.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.53.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.53.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.54.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.54.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.54.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.54.gate_proj.weight_scale": 
"model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.54.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.54.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.55.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.55.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.55.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.55.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.55.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.55.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.56.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.56.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.56.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.56.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.56.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.56.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.57.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.57.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.57.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.57.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.57.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.57.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.58.down_proj.weight": "model-00049-of-00092.safetensors", + 
"model.layers.48.mlp.experts.58.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.58.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.58.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.58.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.58.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.59.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.59.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.59.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.59.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.59.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.59.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.6.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.6.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.6.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.6.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.6.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.6.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.60.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.60.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.60.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.60.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.60.up_proj.weight": 
"model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.60.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.61.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.61.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.61.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.61.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.61.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.61.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.62.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.62.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.62.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.62.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.62.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.62.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.63.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.63.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.63.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.63.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.63.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.63.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.64.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.64.down_proj.weight_scale": "model-00049-of-00092.safetensors", + 
"model.layers.48.mlp.experts.64.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.64.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.64.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.64.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.65.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.65.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.65.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.65.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.65.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.65.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.66.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.66.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.66.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.66.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.66.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.66.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.67.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.67.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.67.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.67.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.67.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.67.up_proj.weight_scale": 
"model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.68.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.68.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.68.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.68.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.68.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.68.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.69.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.69.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.69.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.69.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.69.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.69.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.7.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.7.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.7.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.7.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.7.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.7.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.70.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.70.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.70.gate_proj.weight": "model-00049-of-00092.safetensors", + 
"model.layers.48.mlp.experts.70.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.70.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.70.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.71.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.71.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.71.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.71.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.71.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.71.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.72.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.72.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.72.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.72.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.72.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.72.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.73.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.73.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.73.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.73.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.73.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.73.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.74.down_proj.weight": 
"model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.74.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.74.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.74.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.74.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.74.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.75.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.75.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.75.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.75.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.75.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.75.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.76.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.76.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.76.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.76.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.76.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.76.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.77.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.77.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.77.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.77.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + 
"model.layers.48.mlp.experts.77.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.77.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.78.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.78.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.78.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.78.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.78.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.78.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.79.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.79.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.79.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.79.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.79.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.79.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.8.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.8.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.8.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.8.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.8.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.8.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.80.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.80.down_proj.weight_scale": "model-00049-of-00092.safetensors", 
+ "model.layers.48.mlp.experts.80.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.80.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.80.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.80.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.81.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.81.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.81.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.81.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.81.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.81.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.82.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.82.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.82.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.82.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.82.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.82.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.83.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.83.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.83.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.83.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.83.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.83.up_proj.weight_scale": 
"model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.84.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.84.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.84.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.84.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.84.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.84.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.85.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.85.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.85.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.85.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.85.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.85.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.86.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.86.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.86.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.86.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.86.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.86.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.87.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.87.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.87.gate_proj.weight": "model-00049-of-00092.safetensors", + 
"model.layers.48.mlp.experts.87.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.87.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.87.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.88.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.88.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.88.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.88.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.88.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.88.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.89.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.89.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.89.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.89.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.89.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.89.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.9.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.9.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.9.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.9.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.9.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.9.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.90.down_proj.weight": "model-00049-of-00092.safetensors", 
+ "model.layers.48.mlp.experts.90.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.90.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.90.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.90.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.90.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.91.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.91.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.91.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.91.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.91.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.91.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.92.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.92.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.92.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.92.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.92.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.92.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.93.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.93.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.93.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.93.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.93.up_proj.weight": 
"model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.93.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.94.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.94.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.94.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.94.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.94.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.94.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.95.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.95.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.95.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.95.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.95.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.95.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.96.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.96.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.96.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.96.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.96.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.96.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.97.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.97.down_proj.weight_scale": "model-00049-of-00092.safetensors", + 
"model.layers.48.mlp.experts.97.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.97.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.97.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.97.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.98.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.98.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.98.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.98.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.98.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.98.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.99.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.99.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.99.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.99.gate_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.99.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.experts.99.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.gate.e_score_correction_bias": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.gate.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.shared_experts.down_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.shared_experts.down_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.shared_experts.gate_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.shared_experts.gate_proj.weight_scale": 
"model-00049-of-00092.safetensors", + "model.layers.48.mlp.shared_experts.up_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.mlp.shared_experts.up_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.post_attention_layernorm.weight": "model-00049-of-00092.safetensors", + "model.layers.48.self_attn.k_norm.weight": "model-00049-of-00092.safetensors", + "model.layers.48.self_attn.k_proj.bias": "model-00049-of-00092.safetensors", + "model.layers.48.self_attn.k_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.self_attn.k_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.self_attn.o_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.self_attn.o_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.self_attn.q_norm.weight": "model-00049-of-00092.safetensors", + "model.layers.48.self_attn.q_proj.bias": "model-00049-of-00092.safetensors", + "model.layers.48.self_attn.q_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.self_attn.q_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.48.self_attn.v_proj.bias": "model-00049-of-00092.safetensors", + "model.layers.48.self_attn.v_proj.weight": "model-00049-of-00092.safetensors", + "model.layers.48.self_attn.v_proj.weight_scale": "model-00049-of-00092.safetensors", + "model.layers.49.input_layernorm.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.0.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.0.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.0.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.0.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.0.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.0.up_proj.weight_scale": 
"model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.1.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.1.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.1.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.1.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.1.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.1.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.10.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.10.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.10.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.10.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.10.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.10.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.100.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.100.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.100.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.100.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.100.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.100.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.101.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.101.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.101.gate_proj.weight": "model-00050-of-00092.safetensors", + 
"model.layers.49.mlp.experts.101.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.101.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.101.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.102.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.102.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.102.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.102.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.102.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.102.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.103.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.103.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.103.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.103.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.103.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.103.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.104.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.104.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.104.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.104.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.104.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.104.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.105.down_proj.weight": 
"model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.105.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.105.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.105.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.105.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.105.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.106.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.106.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.106.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.106.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.106.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.106.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.107.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.107.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.107.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.107.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.107.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.107.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.108.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.108.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.108.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.108.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + 
"model.layers.49.mlp.experts.108.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.108.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.109.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.109.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.109.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.109.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.109.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.109.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.11.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.11.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.11.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.11.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.11.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.11.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.110.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.110.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.110.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.110.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.110.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.110.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.111.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.111.down_proj.weight_scale": 
"model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.111.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.111.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.111.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.111.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.112.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.112.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.112.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.112.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.112.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.112.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.113.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.113.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.113.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.113.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.113.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.113.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.114.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.114.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.114.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.114.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.114.up_proj.weight": "model-00050-of-00092.safetensors", + 
"model.layers.49.mlp.experts.114.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.115.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.115.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.115.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.115.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.115.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.115.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.116.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.116.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.116.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.116.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.116.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.116.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.117.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.117.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.117.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.117.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.117.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.117.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.118.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.118.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.118.gate_proj.weight": 
"model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.118.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.118.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.118.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.119.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.119.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.119.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.119.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.119.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.119.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.12.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.12.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.12.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.12.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.12.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.12.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.120.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.120.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.120.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.120.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.120.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.120.up_proj.weight_scale": "model-00050-of-00092.safetensors", + 
"model.layers.49.mlp.experts.121.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.121.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.121.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.121.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.121.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.121.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.122.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.122.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.122.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.122.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.122.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.122.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.123.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.123.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.123.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.123.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.123.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.123.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.124.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.124.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.124.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.124.gate_proj.weight_scale": 
"model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.124.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.124.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.125.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.125.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.125.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.125.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.125.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.125.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.126.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.126.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.126.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.126.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.126.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.126.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.127.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.127.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.127.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.127.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.127.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.127.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.128.down_proj.weight": "model-00050-of-00092.safetensors", + 
"model.layers.49.mlp.experts.128.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.128.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.128.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.128.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.128.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.129.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.129.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.129.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.129.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.129.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.129.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.13.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.13.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.13.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.13.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.13.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.13.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.130.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.130.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.130.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.130.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.130.up_proj.weight": 
"model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.130.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.131.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.131.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.131.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.131.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.131.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.131.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.132.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.132.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.132.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.132.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.132.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.132.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.133.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.133.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.133.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.133.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.133.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.133.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.134.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.134.down_proj.weight_scale": "model-00050-of-00092.safetensors", + 
"model.layers.49.mlp.experts.134.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.134.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.134.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.134.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.135.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.135.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.135.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.135.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.135.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.135.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.136.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.136.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.136.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.136.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.136.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.136.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.137.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.137.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.137.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.137.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.137.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.137.up_proj.weight_scale": 
"model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.138.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.138.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.138.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.138.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.138.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.138.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.139.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.139.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.139.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.139.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.139.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.139.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.14.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.14.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.14.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.14.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.14.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.14.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.140.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.140.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.140.gate_proj.weight": "model-00050-of-00092.safetensors", + 
"model.layers.49.mlp.experts.140.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.140.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.140.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.141.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.141.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.141.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.141.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.141.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.141.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.142.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.142.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.142.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.142.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.142.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.142.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.143.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.143.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.143.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.143.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.143.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.143.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.144.down_proj.weight": 
"model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.144.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.144.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.144.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.144.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.144.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.145.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.145.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.145.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.145.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.145.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.145.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.146.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.146.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.146.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.146.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.146.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.146.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.147.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.147.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.147.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.147.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + 
"model.layers.49.mlp.experts.147.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.147.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.148.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.148.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.148.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.148.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.148.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.148.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.149.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.149.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.149.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.149.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.149.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.149.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.15.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.15.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.15.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.15.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.15.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.15.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.150.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.150.down_proj.weight_scale": 
"model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.150.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.150.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.150.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.150.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.151.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.151.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.151.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.151.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.151.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.151.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.152.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.152.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.152.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.152.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.152.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.152.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.153.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.153.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.153.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.153.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.153.up_proj.weight": "model-00050-of-00092.safetensors", + 
"model.layers.49.mlp.experts.153.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.154.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.154.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.154.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.154.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.154.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.154.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.155.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.155.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.155.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.155.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.155.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.155.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.156.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.156.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.156.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.156.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.156.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.156.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.157.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.157.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.157.gate_proj.weight": 
"model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.157.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.157.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.157.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.158.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.158.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.158.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.158.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.158.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.158.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.159.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.159.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.159.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.159.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.159.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.159.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.16.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.16.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.16.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.16.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.16.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.16.up_proj.weight_scale": "model-00050-of-00092.safetensors", + 
"model.layers.49.mlp.experts.17.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.17.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.17.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.17.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.17.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.17.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.18.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.18.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.18.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.18.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.18.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.18.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.19.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.19.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.19.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.19.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.19.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.19.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.2.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.2.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.2.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.2.gate_proj.weight_scale": 
"model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.2.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.2.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.20.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.20.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.20.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.20.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.20.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.20.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.21.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.21.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.21.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.21.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.21.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.21.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.22.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.22.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.22.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.22.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.22.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.22.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.23.down_proj.weight": "model-00050-of-00092.safetensors", + 
"model.layers.49.mlp.experts.23.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.23.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.23.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.23.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.23.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.24.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.24.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.24.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.24.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.24.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.24.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.25.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.25.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.25.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.25.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.25.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.25.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.26.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.26.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.26.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.26.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.26.up_proj.weight": 
"model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.26.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.27.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.27.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.27.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.27.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.27.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.27.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.28.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.28.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.28.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.28.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.28.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.28.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.29.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.29.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.29.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.29.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.29.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.29.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.3.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.3.down_proj.weight_scale": "model-00050-of-00092.safetensors", + 
"model.layers.49.mlp.experts.3.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.3.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.3.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.3.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.30.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.30.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.30.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.30.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.30.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.30.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.31.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.31.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.31.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.31.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.31.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.31.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.32.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.32.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.32.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.32.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.32.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.32.up_proj.weight_scale": 
"model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.33.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.33.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.33.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.33.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.33.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.33.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.34.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.34.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.34.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.34.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.34.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.34.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.35.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.35.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.35.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.35.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.35.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.35.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.36.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.36.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.36.gate_proj.weight": "model-00050-of-00092.safetensors", + 
"model.layers.49.mlp.experts.36.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.36.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.36.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.37.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.37.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.37.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.37.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.37.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.37.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.38.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.38.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.38.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.38.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.38.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.38.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.39.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.39.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.39.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.39.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.39.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.39.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.4.down_proj.weight": 
"model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.4.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.4.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.4.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.4.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.4.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.40.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.40.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.40.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.40.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.40.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.40.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.41.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.41.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.41.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.41.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.41.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.41.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.42.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.42.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.42.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.42.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + 
"model.layers.49.mlp.experts.42.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.42.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.43.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.43.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.43.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.43.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.43.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.43.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.44.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.44.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.44.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.44.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.44.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.44.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.45.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.45.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.45.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.45.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.45.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.45.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.46.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.46.down_proj.weight_scale": 
"model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.46.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.46.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.46.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.46.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.47.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.47.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.47.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.47.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.47.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.47.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.48.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.48.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.48.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.48.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.48.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.48.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.49.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.49.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.49.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.49.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.49.up_proj.weight": "model-00050-of-00092.safetensors", + 
"model.layers.49.mlp.experts.49.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.5.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.5.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.5.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.5.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.5.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.5.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.50.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.50.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.50.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.50.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.50.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.50.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.51.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.51.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.51.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.51.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.51.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.51.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.52.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.52.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.52.gate_proj.weight": 
"model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.52.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.52.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.52.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.53.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.53.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.53.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.53.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.53.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.53.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.54.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.54.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.54.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.54.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.54.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.54.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.55.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.55.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.55.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.55.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.55.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.55.up_proj.weight_scale": "model-00050-of-00092.safetensors", + 
"model.layers.49.mlp.experts.56.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.56.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.56.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.56.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.56.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.56.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.57.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.57.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.57.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.57.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.57.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.57.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.58.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.58.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.58.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.58.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.58.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.58.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.59.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.59.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.59.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.59.gate_proj.weight_scale": 
"model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.59.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.59.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.6.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.6.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.6.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.6.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.6.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.6.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.60.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.60.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.60.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.60.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.60.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.60.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.61.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.61.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.61.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.61.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.61.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.61.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.62.down_proj.weight": "model-00050-of-00092.safetensors", + 
"model.layers.49.mlp.experts.62.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.62.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.62.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.62.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.62.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.63.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.63.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.63.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.63.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.63.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.63.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.64.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.64.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.64.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.64.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.64.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.64.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.65.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.65.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.65.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.65.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.65.up_proj.weight": 
"model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.65.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.66.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.66.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.66.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.66.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.66.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.66.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.67.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.67.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.67.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.67.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.67.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.67.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.68.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.68.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.68.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.68.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.68.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.68.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.69.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.69.down_proj.weight_scale": "model-00050-of-00092.safetensors", + 
"model.layers.49.mlp.experts.69.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.69.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.69.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.69.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.7.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.7.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.7.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.7.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.7.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.7.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.70.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.70.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.70.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.70.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.70.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.70.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.71.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.71.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.71.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.71.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.71.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.71.up_proj.weight_scale": "model-00050-of-00092.safetensors", 
+ "model.layers.49.mlp.experts.72.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.72.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.72.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.72.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.72.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.72.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.73.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.73.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.73.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.73.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.73.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.73.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.74.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.74.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.74.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.74.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.74.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.74.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.75.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.75.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.75.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.75.gate_proj.weight_scale": 
"model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.75.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.75.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.76.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.76.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.76.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.76.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.76.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.76.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.77.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.77.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.77.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.77.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.77.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.77.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.78.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.78.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.78.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.78.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.78.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.78.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.79.down_proj.weight": "model-00050-of-00092.safetensors", + 
"model.layers.49.mlp.experts.79.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.79.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.79.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.79.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.79.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.8.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.8.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.8.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.8.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.8.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.8.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.80.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.80.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.80.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.80.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.80.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.80.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.81.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.81.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.81.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.81.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.81.up_proj.weight": 
"model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.81.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.82.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.82.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.82.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.82.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.82.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.82.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.83.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.83.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.83.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.83.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.83.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.83.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.84.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.84.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.84.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.84.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.84.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.84.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.85.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.85.down_proj.weight_scale": "model-00050-of-00092.safetensors", + 
"model.layers.49.mlp.experts.85.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.85.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.85.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.85.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.86.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.86.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.86.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.86.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.86.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.86.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.87.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.87.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.87.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.87.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.87.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.87.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.88.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.88.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.88.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.88.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.88.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.88.up_proj.weight_scale": 
"model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.89.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.89.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.89.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.89.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.89.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.89.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.9.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.9.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.9.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.9.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.9.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.9.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.90.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.90.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.90.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.90.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.90.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.90.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.91.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.91.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.91.gate_proj.weight": "model-00050-of-00092.safetensors", + 
"model.layers.49.mlp.experts.91.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.91.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.91.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.92.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.92.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.92.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.92.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.92.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.92.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.93.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.93.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.93.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.93.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.93.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.93.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.94.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.94.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.94.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.94.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.94.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.94.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.95.down_proj.weight": 
"model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.95.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.95.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.95.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.95.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.95.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.96.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.96.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.96.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.96.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.96.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.96.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.97.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.97.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.97.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.97.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.97.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.97.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.98.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.98.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.98.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.98.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + 
"model.layers.49.mlp.experts.98.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.98.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.99.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.99.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.99.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.99.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.99.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.experts.99.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.gate.e_score_correction_bias": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.gate.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.shared_experts.down_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.shared_experts.down_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.shared_experts.gate_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.shared_experts.gate_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.shared_experts.up_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.mlp.shared_experts.up_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.post_attention_layernorm.weight": "model-00050-of-00092.safetensors", + "model.layers.49.self_attn.k_norm.weight": "model-00050-of-00092.safetensors", + "model.layers.49.self_attn.k_proj.bias": "model-00050-of-00092.safetensors", + "model.layers.49.self_attn.k_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.self_attn.k_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.self_attn.o_proj.weight": "model-00050-of-00092.safetensors", + 
"model.layers.49.self_attn.o_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.self_attn.q_norm.weight": "model-00050-of-00092.safetensors", + "model.layers.49.self_attn.q_proj.bias": "model-00050-of-00092.safetensors", + "model.layers.49.self_attn.q_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.self_attn.q_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.49.self_attn.v_proj.bias": "model-00050-of-00092.safetensors", + "model.layers.49.self_attn.v_proj.weight": "model-00050-of-00092.safetensors", + "model.layers.49.self_attn.v_proj.weight_scale": "model-00050-of-00092.safetensors", + "model.layers.50.input_layernorm.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.0.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.0.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.0.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.0.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.0.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.0.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.1.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.1.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.1.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.1.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.1.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.1.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.10.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.10.down_proj.weight_scale": 
"model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.10.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.10.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.10.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.10.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.100.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.100.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.100.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.100.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.100.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.100.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.101.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.101.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.101.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.101.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.101.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.101.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.102.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.102.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.102.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.102.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.102.up_proj.weight": "model-00051-of-00092.safetensors", + 
"model.layers.50.mlp.experts.102.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.103.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.103.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.103.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.103.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.103.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.103.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.104.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.104.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.104.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.104.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.104.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.104.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.105.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.105.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.105.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.105.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.105.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.105.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.106.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.106.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.106.gate_proj.weight": 
"model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.106.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.106.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.106.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.107.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.107.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.107.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.107.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.107.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.107.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.108.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.108.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.108.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.108.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.108.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.108.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.109.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.109.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.109.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.109.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.109.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.109.up_proj.weight_scale": "model-00051-of-00092.safetensors", + 
"model.layers.50.mlp.experts.11.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.11.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.11.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.11.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.11.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.11.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.110.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.110.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.110.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.110.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.110.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.110.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.111.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.111.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.111.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.111.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.111.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.111.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.112.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.112.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.112.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.112.gate_proj.weight_scale": 
"model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.112.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.112.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.113.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.113.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.113.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.113.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.113.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.113.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.114.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.114.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.114.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.114.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.114.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.114.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.115.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.115.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.115.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.115.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.115.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.115.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.116.down_proj.weight": "model-00051-of-00092.safetensors", + 
"model.layers.50.mlp.experts.116.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.116.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.116.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.116.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.116.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.117.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.117.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.117.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.117.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.117.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.117.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.118.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.118.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.118.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.118.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.118.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.118.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.119.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.119.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.119.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.119.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.119.up_proj.weight": 
"model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.119.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.12.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.12.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.12.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.12.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.12.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.12.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.120.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.120.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.120.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.120.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.120.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.120.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.121.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.121.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.121.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.121.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.121.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.121.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.122.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.122.down_proj.weight_scale": "model-00051-of-00092.safetensors", + 
"model.layers.50.mlp.experts.122.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.122.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.122.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.122.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.123.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.123.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.123.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.123.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.123.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.123.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.124.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.124.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.124.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.124.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.124.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.124.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.125.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.125.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.125.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.125.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.125.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.125.up_proj.weight_scale": 
"model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.126.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.126.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.126.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.126.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.126.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.126.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.127.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.127.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.127.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.127.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.127.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.127.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.128.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.128.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.128.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.128.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.128.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.128.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.129.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.129.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.129.gate_proj.weight": "model-00051-of-00092.safetensors", + 
"model.layers.50.mlp.experts.129.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.129.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.129.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.13.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.13.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.13.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.13.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.13.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.13.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.130.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.130.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.130.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.130.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.130.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.130.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.131.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.131.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.131.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.131.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.131.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.131.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.132.down_proj.weight": 
"model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.132.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.132.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.132.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.132.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.132.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.133.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.133.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.133.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.133.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.133.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.133.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.134.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.134.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.134.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.134.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.134.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.134.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.135.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.135.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.135.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.135.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + 
"model.layers.50.mlp.experts.135.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.135.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.136.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.136.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.136.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.136.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.136.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.136.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.137.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.137.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.137.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.137.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.137.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.137.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.138.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.138.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.138.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.138.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.138.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.138.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.139.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.139.down_proj.weight_scale": 
"model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.139.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.139.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.139.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.139.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.14.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.14.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.14.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.14.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.14.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.14.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.140.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.140.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.140.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.140.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.140.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.140.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.141.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.141.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.141.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.141.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.141.up_proj.weight": "model-00051-of-00092.safetensors", + 
"model.layers.50.mlp.experts.141.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.142.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.142.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.142.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.142.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.142.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.142.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.143.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.143.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.143.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.143.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.143.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.143.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.144.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.144.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.144.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.144.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.144.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.144.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.145.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.145.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.145.gate_proj.weight": 
"model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.145.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.145.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.145.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.146.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.146.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.146.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.146.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.146.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.146.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.147.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.147.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.147.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.147.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.147.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.147.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.148.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.148.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.148.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.148.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.148.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.148.up_proj.weight_scale": "model-00051-of-00092.safetensors", + 
"model.layers.50.mlp.experts.149.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.149.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.149.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.149.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.149.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.149.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.15.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.15.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.15.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.15.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.15.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.15.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.150.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.150.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.150.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.150.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.150.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.150.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.151.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.151.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.151.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.151.gate_proj.weight_scale": 
"model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.151.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.151.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.152.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.152.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.152.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.152.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.152.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.152.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.153.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.153.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.153.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.153.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.153.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.153.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.154.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.154.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.154.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.154.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.154.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.154.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.155.down_proj.weight": "model-00051-of-00092.safetensors", + 
"model.layers.50.mlp.experts.155.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.155.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.155.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.155.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.155.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.156.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.156.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.156.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.156.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.156.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.156.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.157.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.157.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.157.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.157.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.157.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.157.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.158.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.158.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.158.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.158.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.158.up_proj.weight": 
"model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.158.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.159.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.159.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.159.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.159.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.159.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.159.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.16.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.16.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.16.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.16.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.16.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.16.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.17.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.17.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.17.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.17.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.17.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.17.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.18.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.18.down_proj.weight_scale": "model-00051-of-00092.safetensors", + 
"model.layers.50.mlp.experts.18.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.18.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.18.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.18.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.19.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.19.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.19.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.19.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.19.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.19.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.2.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.2.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.2.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.2.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.2.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.2.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.20.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.20.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.20.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.20.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.20.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.20.up_proj.weight_scale": "model-00051-of-00092.safetensors", 
+ "model.layers.50.mlp.experts.21.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.21.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.21.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.21.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.21.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.21.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.22.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.22.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.22.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.22.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.22.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.22.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.23.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.23.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.23.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.23.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.23.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.23.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.24.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.24.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.24.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.24.gate_proj.weight_scale": 
"model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.24.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.24.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.25.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.25.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.25.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.25.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.25.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.25.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.26.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.26.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.26.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.26.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.26.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.26.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.27.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.27.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.27.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.27.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.27.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.27.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.28.down_proj.weight": "model-00051-of-00092.safetensors", + 
"model.layers.50.mlp.experts.28.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.28.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.28.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.28.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.28.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.29.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.29.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.29.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.29.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.29.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.29.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.3.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.3.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.3.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.3.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.3.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.3.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.30.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.30.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.30.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.30.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.30.up_proj.weight": 
"model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.30.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.31.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.31.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.31.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.31.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.31.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.31.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.32.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.32.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.32.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.32.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.32.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.32.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.33.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.33.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.33.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.33.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.33.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.33.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.34.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.34.down_proj.weight_scale": "model-00051-of-00092.safetensors", + 
"model.layers.50.mlp.experts.34.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.34.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.34.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.34.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.35.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.35.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.35.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.35.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.35.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.35.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.36.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.36.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.36.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.36.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.36.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.36.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.37.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.37.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.37.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.37.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.37.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.37.up_proj.weight_scale": 
"model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.38.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.38.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.38.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.38.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.38.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.38.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.39.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.39.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.39.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.39.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.39.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.39.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.4.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.4.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.4.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.4.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.4.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.4.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.40.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.40.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.40.gate_proj.weight": "model-00051-of-00092.safetensors", + 
"model.layers.50.mlp.experts.40.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.40.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.40.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.41.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.41.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.41.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.41.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.41.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.41.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.42.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.42.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.42.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.42.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.42.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.42.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.43.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.43.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.43.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.43.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.43.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.43.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.44.down_proj.weight": 
"model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.44.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.44.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.44.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.44.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.44.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.45.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.45.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.45.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.45.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.45.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.45.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.46.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.46.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.46.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.46.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.46.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.46.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.47.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.47.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.47.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.47.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + 
"model.layers.50.mlp.experts.47.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.47.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.48.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.48.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.48.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.48.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.48.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.48.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.49.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.49.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.49.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.49.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.49.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.49.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.5.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.5.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.5.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.5.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.5.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.5.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.50.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.50.down_proj.weight_scale": "model-00051-of-00092.safetensors", 
+ "model.layers.50.mlp.experts.50.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.50.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.50.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.50.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.51.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.51.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.51.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.51.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.51.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.51.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.52.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.52.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.52.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.52.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.52.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.52.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.53.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.53.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.53.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.53.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.53.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.53.up_proj.weight_scale": 
"model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.54.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.54.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.54.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.54.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.54.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.54.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.55.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.55.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.55.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.55.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.55.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.55.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.56.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.56.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.56.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.56.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.56.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.56.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.57.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.57.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.57.gate_proj.weight": "model-00051-of-00092.safetensors", + 
"model.layers.50.mlp.experts.57.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.57.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.57.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.58.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.58.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.58.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.58.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.58.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.58.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.59.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.59.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.59.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.59.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.59.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.59.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.6.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.6.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.6.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.6.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.6.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.6.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.60.down_proj.weight": "model-00051-of-00092.safetensors", 
+ "model.layers.50.mlp.experts.60.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.60.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.60.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.60.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.60.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.61.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.61.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.61.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.61.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.61.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.61.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.62.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.62.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.62.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.62.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.62.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.62.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.63.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.63.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.63.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.63.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.63.up_proj.weight": 
"model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.63.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.64.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.64.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.64.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.64.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.64.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.64.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.65.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.65.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.65.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.65.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.65.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.65.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.66.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.66.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.66.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.66.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.66.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.66.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.67.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.67.down_proj.weight_scale": "model-00051-of-00092.safetensors", + 
"model.layers.50.mlp.experts.67.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.67.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.67.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.67.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.68.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.68.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.68.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.68.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.68.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.68.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.69.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.69.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.69.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.69.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.69.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.69.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.7.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.7.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.7.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.7.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.7.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.7.up_proj.weight_scale": "model-00051-of-00092.safetensors", 
+ "model.layers.50.mlp.experts.70.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.70.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.70.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.70.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.70.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.70.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.71.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.71.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.71.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.71.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.71.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.71.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.72.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.72.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.72.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.72.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.72.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.72.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.73.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.73.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.73.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.73.gate_proj.weight_scale": 
"model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.73.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.73.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.74.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.74.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.74.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.74.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.74.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.74.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.75.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.75.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.75.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.75.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.75.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.75.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.76.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.76.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.76.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.76.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.76.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.76.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.77.down_proj.weight": "model-00051-of-00092.safetensors", + 
"model.layers.50.mlp.experts.77.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.77.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.77.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.77.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.77.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.78.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.78.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.78.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.78.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.78.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.78.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.79.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.79.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.79.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.79.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.79.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.79.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.8.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.8.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.8.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.8.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.8.up_proj.weight": 
"model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.8.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.80.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.80.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.80.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.80.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.80.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.80.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.81.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.81.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.81.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.81.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.81.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.81.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.82.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.82.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.82.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.82.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.82.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.82.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.83.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.83.down_proj.weight_scale": "model-00051-of-00092.safetensors", + 
"model.layers.50.mlp.experts.83.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.83.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.83.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.83.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.84.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.84.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.84.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.84.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.84.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.84.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.85.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.85.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.85.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.85.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.85.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.85.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.86.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.86.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.86.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.86.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.86.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.86.up_proj.weight_scale": 
"model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.87.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.87.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.87.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.87.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.87.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.87.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.88.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.88.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.88.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.88.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.88.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.88.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.89.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.89.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.89.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.89.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.89.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.89.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.9.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.9.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.9.gate_proj.weight": "model-00051-of-00092.safetensors", + 
"model.layers.50.mlp.experts.9.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.9.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.9.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.90.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.90.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.90.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.90.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.90.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.90.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.91.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.91.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.91.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.91.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.91.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.91.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.92.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.92.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.92.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.92.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.92.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.92.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.93.down_proj.weight": 
"model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.93.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.93.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.93.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.93.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.93.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.94.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.94.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.94.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.94.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.94.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.94.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.95.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.95.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.95.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.95.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.95.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.95.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.96.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.96.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.96.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.96.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + 
"model.layers.50.mlp.experts.96.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.96.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.97.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.97.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.97.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.97.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.97.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.97.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.98.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.98.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.98.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.98.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.98.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.98.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.99.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.99.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.99.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.99.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.99.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.experts.99.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.gate.e_score_correction_bias": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.gate.weight": "model-00051-of-00092.safetensors", + 
"model.layers.50.mlp.shared_experts.down_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.shared_experts.down_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.shared_experts.gate_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.shared_experts.gate_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.shared_experts.up_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.mlp.shared_experts.up_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.post_attention_layernorm.weight": "model-00051-of-00092.safetensors", + "model.layers.50.self_attn.k_norm.weight": "model-00051-of-00092.safetensors", + "model.layers.50.self_attn.k_proj.bias": "model-00051-of-00092.safetensors", + "model.layers.50.self_attn.k_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.self_attn.k_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.self_attn.o_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.self_attn.o_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.self_attn.q_norm.weight": "model-00051-of-00092.safetensors", + "model.layers.50.self_attn.q_proj.bias": "model-00051-of-00092.safetensors", + "model.layers.50.self_attn.q_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.self_attn.q_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.50.self_attn.v_proj.bias": "model-00051-of-00092.safetensors", + "model.layers.50.self_attn.v_proj.weight": "model-00051-of-00092.safetensors", + "model.layers.50.self_attn.v_proj.weight_scale": "model-00051-of-00092.safetensors", + "model.layers.51.input_layernorm.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.0.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.0.down_proj.weight_scale": "model-00052-of-00092.safetensors", + 
"model.layers.51.mlp.experts.0.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.0.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.0.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.0.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.1.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.1.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.1.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.1.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.1.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.1.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.10.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.10.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.10.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.10.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.10.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.10.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.100.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.100.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.100.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.100.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.100.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.100.up_proj.weight_scale": 
"model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.101.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.101.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.101.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.101.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.101.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.101.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.102.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.102.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.102.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.102.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.102.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.102.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.103.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.103.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.103.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.103.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.103.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.103.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.104.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.104.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.104.gate_proj.weight": "model-00052-of-00092.safetensors", + 
"model.layers.51.mlp.experts.104.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.104.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.104.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.105.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.105.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.105.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.105.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.105.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.105.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.106.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.106.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.106.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.106.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.106.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.106.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.107.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.107.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.107.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.107.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.107.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.107.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.108.down_proj.weight": 
"model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.108.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.108.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.108.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.108.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.108.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.109.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.109.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.109.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.109.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.109.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.109.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.11.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.11.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.11.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.11.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.11.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.11.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.110.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.110.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.110.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.110.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + 
"model.layers.51.mlp.experts.110.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.110.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.111.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.111.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.111.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.111.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.111.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.111.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.112.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.112.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.112.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.112.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.112.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.112.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.113.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.113.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.113.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.113.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.113.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.113.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.114.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.114.down_proj.weight_scale": 
"model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.114.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.114.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.114.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.114.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.115.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.115.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.115.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.115.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.115.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.115.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.116.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.116.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.116.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.116.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.116.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.116.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.117.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.117.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.117.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.117.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.117.up_proj.weight": "model-00052-of-00092.safetensors", + 
"model.layers.51.mlp.experts.117.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.118.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.118.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.118.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.118.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.118.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.118.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.119.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.119.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.119.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.119.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.119.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.119.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.12.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.12.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.12.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.12.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.12.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.12.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.120.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.120.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.120.gate_proj.weight": 
"model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.120.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.120.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.120.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.121.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.121.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.121.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.121.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.121.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.121.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.122.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.122.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.122.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.122.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.122.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.122.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.123.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.123.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.123.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.123.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.123.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.123.up_proj.weight_scale": "model-00052-of-00092.safetensors", + 
"model.layers.51.mlp.experts.124.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.124.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.124.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.124.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.124.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.124.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.125.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.125.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.125.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.125.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.125.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.125.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.126.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.126.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.126.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.126.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.126.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.126.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.127.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.127.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.127.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.127.gate_proj.weight_scale": 
"model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.127.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.127.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.128.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.128.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.128.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.128.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.128.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.128.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.129.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.129.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.129.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.129.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.129.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.129.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.13.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.13.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.13.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.13.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.13.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.13.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.130.down_proj.weight": "model-00052-of-00092.safetensors", + 
"model.layers.51.mlp.experts.130.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.130.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.130.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.130.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.130.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.131.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.131.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.131.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.131.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.131.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.131.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.132.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.132.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.132.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.132.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.132.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.132.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.133.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.133.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.133.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.133.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.133.up_proj.weight": 
"model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.133.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.134.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.134.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.134.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.134.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.134.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.134.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.135.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.135.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.135.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.135.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.135.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.135.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.136.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.136.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.136.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.136.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.136.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.136.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.137.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.137.down_proj.weight_scale": "model-00052-of-00092.safetensors", + 
"model.layers.51.mlp.experts.137.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.137.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.137.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.137.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.138.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.138.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.138.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.138.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.138.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.138.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.139.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.139.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.139.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.139.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.139.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.139.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.14.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.14.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.14.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.14.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.14.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.14.up_proj.weight_scale": 
"model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.140.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.140.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.140.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.140.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.140.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.140.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.141.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.141.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.141.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.141.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.141.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.141.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.142.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.142.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.142.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.142.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.142.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.142.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.143.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.143.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.143.gate_proj.weight": "model-00052-of-00092.safetensors", + 
"model.layers.51.mlp.experts.143.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.143.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.143.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.144.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.144.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.144.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.144.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.144.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.144.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.145.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.145.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.145.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.145.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.145.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.145.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.146.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.146.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.146.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.146.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.146.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.146.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.147.down_proj.weight": 
"model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.147.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.147.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.147.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.147.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.147.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.148.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.148.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.148.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.148.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.148.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.148.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.149.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.149.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.149.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.149.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.149.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.149.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.15.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.15.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.15.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.15.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + 
"model.layers.51.mlp.experts.15.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.15.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.150.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.150.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.150.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.150.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.150.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.150.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.151.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.151.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.151.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.151.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.151.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.151.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.152.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.152.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.152.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.152.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.152.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.152.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.153.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.153.down_proj.weight_scale": 
"model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.153.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.153.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.153.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.153.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.154.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.154.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.154.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.154.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.154.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.154.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.155.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.155.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.155.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.155.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.155.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.155.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.156.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.156.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.156.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.156.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.156.up_proj.weight": "model-00052-of-00092.safetensors", + 
"model.layers.51.mlp.experts.156.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.157.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.157.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.157.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.157.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.157.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.157.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.158.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.158.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.158.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.158.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.158.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.158.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.159.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.159.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.159.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.159.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.159.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.159.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.16.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.16.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.16.gate_proj.weight": 
"model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.16.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.16.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.16.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.17.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.17.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.17.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.17.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.17.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.17.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.18.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.18.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.18.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.18.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.18.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.18.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.19.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.19.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.19.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.19.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.19.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.19.up_proj.weight_scale": "model-00052-of-00092.safetensors", + 
"model.layers.51.mlp.experts.2.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.2.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.2.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.2.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.2.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.2.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.20.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.20.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.20.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.20.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.20.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.20.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.21.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.21.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.21.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.21.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.21.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.21.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.22.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.22.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.22.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.22.gate_proj.weight_scale": 
"model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.22.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.22.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.23.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.23.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.23.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.23.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.23.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.23.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.24.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.24.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.24.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.24.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.24.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.24.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.25.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.25.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.25.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.25.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.25.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.25.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.26.down_proj.weight": "model-00052-of-00092.safetensors", + 
"model.layers.51.mlp.experts.26.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.26.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.26.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.26.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.26.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.27.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.27.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.27.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.27.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.27.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.27.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.28.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.28.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.28.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.28.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.28.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.28.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.29.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.29.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.29.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.29.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.29.up_proj.weight": 
"model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.29.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.3.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.3.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.3.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.3.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.3.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.3.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.30.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.30.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.30.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.30.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.30.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.30.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.31.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.31.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.31.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.31.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.31.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.31.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.32.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.32.down_proj.weight_scale": "model-00052-of-00092.safetensors", + 
"model.layers.51.mlp.experts.32.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.32.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.32.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.32.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.33.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.33.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.33.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.33.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.33.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.33.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.34.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.34.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.34.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.34.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.34.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.34.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.35.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.35.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.35.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.35.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.35.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.35.up_proj.weight_scale": 
"model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.36.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.36.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.36.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.36.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.36.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.36.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.37.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.37.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.37.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.37.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.37.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.37.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.38.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.38.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.38.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.38.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.38.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.38.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.39.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.39.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.39.gate_proj.weight": "model-00052-of-00092.safetensors", + 
"model.layers.51.mlp.experts.39.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.39.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.39.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.4.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.4.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.4.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.4.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.4.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.4.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.40.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.40.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.40.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.40.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.40.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.40.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.41.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.41.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.41.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.41.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.41.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.41.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.42.down_proj.weight": "model-00052-of-00092.safetensors", 
+ "model.layers.51.mlp.experts.42.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.42.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.42.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.42.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.42.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.43.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.43.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.43.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.43.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.43.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.43.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.44.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.44.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.44.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.44.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.44.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.44.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.45.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.45.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.45.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.45.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.45.up_proj.weight": 
"model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.45.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.46.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.46.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.46.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.46.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.46.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.46.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.47.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.47.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.47.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.47.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.47.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.47.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.48.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.48.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.48.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.48.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.48.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.48.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.49.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.49.down_proj.weight_scale": "model-00052-of-00092.safetensors", + 
"model.layers.51.mlp.experts.49.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.49.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.49.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.49.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.5.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.5.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.5.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.5.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.5.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.5.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.50.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.50.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.50.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.50.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.50.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.50.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.51.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.51.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.51.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.51.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.51.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.51.up_proj.weight_scale": "model-00052-of-00092.safetensors", 
+ "model.layers.51.mlp.experts.52.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.52.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.52.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.52.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.52.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.52.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.53.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.53.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.53.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.53.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.53.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.53.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.54.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.54.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.54.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.54.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.54.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.54.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.55.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.55.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.55.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.55.gate_proj.weight_scale": 
"model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.55.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.55.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.56.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.56.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.56.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.56.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.56.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.56.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.57.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.57.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.57.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.57.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.57.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.57.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.58.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.58.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.58.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.58.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.58.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.58.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.59.down_proj.weight": "model-00052-of-00092.safetensors", + 
"model.layers.51.mlp.experts.59.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.59.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.59.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.59.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.59.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.6.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.6.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.6.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.6.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.6.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.6.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.60.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.60.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.60.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.60.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.60.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.60.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.61.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.61.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.61.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.61.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.61.up_proj.weight": 
"model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.61.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.62.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.62.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.62.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.62.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.62.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.62.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.63.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.63.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.63.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.63.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.63.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.63.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.64.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.64.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.64.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.64.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.64.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.64.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.65.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.65.down_proj.weight_scale": "model-00052-of-00092.safetensors", + 
"model.layers.51.mlp.experts.65.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.65.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.65.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.65.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.66.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.66.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.66.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.66.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.66.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.66.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.67.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.67.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.67.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.67.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.67.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.67.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.68.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.68.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.68.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.68.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.68.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.68.up_proj.weight_scale": 
"model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.69.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.69.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.69.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.69.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.69.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.69.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.7.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.7.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.7.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.7.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.7.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.7.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.70.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.70.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.70.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.70.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.70.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.70.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.71.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.71.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.71.gate_proj.weight": "model-00052-of-00092.safetensors", + 
"model.layers.51.mlp.experts.71.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.71.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.71.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.72.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.72.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.72.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.72.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.72.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.72.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.73.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.73.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.73.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.73.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.73.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.73.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.74.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.74.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.74.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.74.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.74.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.74.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.75.down_proj.weight": 
"model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.75.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.75.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.75.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.75.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.75.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.76.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.76.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.76.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.76.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.76.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.76.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.77.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.77.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.77.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.77.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.77.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.77.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.78.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.78.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.78.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.78.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + 
"model.layers.51.mlp.experts.78.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.78.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.79.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.79.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.79.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.79.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.79.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.79.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.8.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.8.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.8.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.8.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.8.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.8.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.80.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.80.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.80.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.80.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.80.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.80.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.81.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.81.down_proj.weight_scale": "model-00052-of-00092.safetensors", 
+ "model.layers.51.mlp.experts.81.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.81.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.81.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.81.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.82.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.82.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.82.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.82.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.82.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.82.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.83.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.83.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.83.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.83.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.83.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.83.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.84.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.84.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.84.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.84.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.84.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.84.up_proj.weight_scale": 
"model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.85.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.85.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.85.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.85.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.85.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.85.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.86.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.86.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.86.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.86.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.86.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.86.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.87.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.87.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.87.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.87.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.87.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.87.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.88.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.88.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.88.gate_proj.weight": "model-00052-of-00092.safetensors", + 
"model.layers.51.mlp.experts.88.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.88.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.88.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.89.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.89.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.89.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.89.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.89.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.89.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.9.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.9.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.9.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.9.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.9.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.9.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.90.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.90.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.90.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.90.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.90.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.90.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.91.down_proj.weight": "model-00052-of-00092.safetensors", 
+ "model.layers.51.mlp.experts.91.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.91.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.91.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.91.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.91.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.92.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.92.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.92.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.92.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.92.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.92.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.93.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.93.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.93.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.93.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.93.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.93.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.94.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.94.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.94.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.94.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.94.up_proj.weight": 
"model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.94.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.95.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.95.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.95.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.95.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.95.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.95.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.96.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.96.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.96.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.96.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.96.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.96.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.97.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.97.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.97.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.97.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.97.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.97.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.98.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.98.down_proj.weight_scale": "model-00052-of-00092.safetensors", + 
"model.layers.51.mlp.experts.98.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.98.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.98.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.98.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.99.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.99.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.99.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.99.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.99.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.experts.99.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.gate.e_score_correction_bias": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.gate.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.shared_experts.down_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.shared_experts.down_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.shared_experts.gate_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.shared_experts.gate_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.shared_experts.up_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.mlp.shared_experts.up_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.post_attention_layernorm.weight": "model-00052-of-00092.safetensors", + "model.layers.51.self_attn.k_norm.weight": "model-00052-of-00092.safetensors", + "model.layers.51.self_attn.k_proj.bias": "model-00052-of-00092.safetensors", + "model.layers.51.self_attn.k_proj.weight": "model-00052-of-00092.safetensors", + 
"model.layers.51.self_attn.k_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.self_attn.o_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.self_attn.o_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.self_attn.q_norm.weight": "model-00052-of-00092.safetensors", + "model.layers.51.self_attn.q_proj.bias": "model-00052-of-00092.safetensors", + "model.layers.51.self_attn.q_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.self_attn.q_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.51.self_attn.v_proj.bias": "model-00052-of-00092.safetensors", + "model.layers.51.self_attn.v_proj.weight": "model-00052-of-00092.safetensors", + "model.layers.51.self_attn.v_proj.weight_scale": "model-00052-of-00092.safetensors", + "model.layers.52.input_layernorm.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.0.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.0.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.0.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.0.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.0.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.0.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.1.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.1.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.1.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.1.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.1.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.1.up_proj.weight_scale": "model-00053-of-00092.safetensors", + 
"model.layers.52.mlp.experts.10.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.10.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.10.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.10.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.10.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.10.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.100.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.100.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.100.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.100.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.100.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.100.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.101.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.101.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.101.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.101.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.101.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.101.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.102.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.102.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.102.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.102.gate_proj.weight_scale": 
"model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.102.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.102.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.103.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.103.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.103.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.103.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.103.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.103.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.104.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.104.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.104.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.104.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.104.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.104.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.105.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.105.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.105.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.105.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.105.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.105.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.106.down_proj.weight": "model-00053-of-00092.safetensors", + 
"model.layers.52.mlp.experts.106.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.106.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.106.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.106.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.106.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.107.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.107.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.107.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.107.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.107.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.107.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.108.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.108.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.108.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.108.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.108.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.108.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.109.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.109.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.109.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.109.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.109.up_proj.weight": 
"model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.109.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.11.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.11.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.11.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.11.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.11.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.11.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.110.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.110.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.110.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.110.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.110.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.110.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.111.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.111.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.111.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.111.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.111.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.111.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.112.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.112.down_proj.weight_scale": "model-00053-of-00092.safetensors", + 
"model.layers.52.mlp.experts.112.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.112.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.112.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.112.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.113.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.113.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.113.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.113.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.113.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.113.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.114.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.114.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.114.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.114.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.114.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.114.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.115.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.115.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.115.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.115.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.115.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.115.up_proj.weight_scale": 
"model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.116.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.116.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.116.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.116.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.116.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.116.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.117.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.117.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.117.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.117.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.117.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.117.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.118.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.118.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.118.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.118.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.118.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.118.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.119.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.119.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.119.gate_proj.weight": "model-00053-of-00092.safetensors", + 
"model.layers.52.mlp.experts.119.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.119.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.119.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.12.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.12.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.12.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.12.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.12.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.12.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.120.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.120.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.120.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.120.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.120.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.120.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.121.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.121.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.121.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.121.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.121.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.121.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.122.down_proj.weight": 
"model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.122.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.122.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.122.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.122.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.122.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.123.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.123.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.123.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.123.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.123.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.123.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.124.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.124.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.124.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.124.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.124.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.124.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.125.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.125.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.125.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.125.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + 
"model.layers.52.mlp.experts.125.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.125.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.126.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.126.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.126.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.126.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.126.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.126.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.127.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.127.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.127.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.127.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.127.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.127.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.128.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.128.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.128.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.128.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.128.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.128.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.129.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.129.down_proj.weight_scale": 
"model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.129.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.129.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.129.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.129.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.13.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.13.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.13.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.13.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.13.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.13.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.130.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.130.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.130.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.130.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.130.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.130.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.131.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.131.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.131.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.131.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.131.up_proj.weight": "model-00053-of-00092.safetensors", + 
"model.layers.52.mlp.experts.131.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.132.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.132.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.132.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.132.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.132.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.132.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.133.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.133.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.133.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.133.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.133.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.133.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.134.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.134.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.134.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.134.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.134.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.134.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.135.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.135.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.135.gate_proj.weight": 
"model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.135.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.135.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.135.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.136.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.136.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.136.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.136.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.136.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.136.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.137.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.137.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.137.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.137.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.137.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.137.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.138.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.138.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.138.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.138.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.138.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.138.up_proj.weight_scale": "model-00053-of-00092.safetensors", + 
"model.layers.52.mlp.experts.139.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.139.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.139.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.139.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.139.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.139.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.14.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.14.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.14.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.14.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.14.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.14.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.140.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.140.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.140.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.140.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.140.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.140.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.141.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.141.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.141.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.141.gate_proj.weight_scale": 
"model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.141.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.141.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.142.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.142.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.142.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.142.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.142.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.142.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.143.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.143.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.143.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.143.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.143.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.143.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.144.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.144.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.144.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.144.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.144.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.144.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.145.down_proj.weight": "model-00053-of-00092.safetensors", + 
"model.layers.52.mlp.experts.145.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.145.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.145.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.145.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.145.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.146.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.146.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.146.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.146.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.146.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.146.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.147.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.147.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.147.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.147.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.147.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.147.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.148.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.148.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.148.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.148.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.148.up_proj.weight": 
"model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.148.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.149.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.149.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.149.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.149.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.149.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.149.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.15.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.15.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.15.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.15.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.15.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.15.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.150.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.150.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.150.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.150.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.150.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.150.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.151.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.151.down_proj.weight_scale": "model-00053-of-00092.safetensors", + 
"model.layers.52.mlp.experts.151.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.151.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.151.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.151.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.152.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.152.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.152.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.152.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.152.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.152.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.153.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.153.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.153.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.153.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.153.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.153.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.154.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.154.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.154.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.154.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.154.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.154.up_proj.weight_scale": 
"model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.155.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.155.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.155.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.155.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.155.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.155.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.156.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.156.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.156.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.156.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.156.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.156.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.157.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.157.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.157.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.157.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.157.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.157.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.158.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.158.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.158.gate_proj.weight": "model-00053-of-00092.safetensors", + 
"model.layers.52.mlp.experts.158.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.158.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.158.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.159.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.159.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.159.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.159.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.159.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.159.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.16.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.16.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.16.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.16.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.16.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.16.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.17.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.17.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.17.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.17.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.17.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.17.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.18.down_proj.weight": 
"model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.18.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.18.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.18.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.18.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.18.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.19.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.19.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.19.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.19.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.19.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.19.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.2.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.2.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.2.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.2.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.2.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.2.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.20.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.20.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.20.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.20.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + 
"model.layers.52.mlp.experts.20.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.20.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.21.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.21.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.21.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.21.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.21.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.21.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.22.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.22.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.22.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.22.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.22.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.22.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.23.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.23.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.23.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.23.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.23.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.23.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.24.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.24.down_proj.weight_scale": 
"model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.24.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.24.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.24.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.24.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.25.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.25.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.25.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.25.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.25.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.25.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.26.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.26.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.26.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.26.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.26.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.26.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.27.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.27.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.27.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.27.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.27.up_proj.weight": "model-00053-of-00092.safetensors", + 
"model.layers.52.mlp.experts.27.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.28.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.28.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.28.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.28.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.28.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.28.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.29.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.29.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.29.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.29.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.29.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.29.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.3.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.3.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.3.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.3.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.3.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.3.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.30.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.30.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.30.gate_proj.weight": 
"model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.30.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.30.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.30.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.31.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.31.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.31.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.31.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.31.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.31.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.32.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.32.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.32.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.32.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.32.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.32.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.33.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.33.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.33.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.33.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.33.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.33.up_proj.weight_scale": "model-00053-of-00092.safetensors", + 
"model.layers.52.mlp.experts.34.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.34.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.34.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.34.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.34.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.34.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.35.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.35.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.35.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.35.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.35.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.35.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.36.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.36.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.36.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.36.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.36.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.36.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.37.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.37.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.37.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.37.gate_proj.weight_scale": 
"model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.37.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.37.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.38.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.38.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.38.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.38.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.38.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.38.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.39.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.39.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.39.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.39.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.39.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.39.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.4.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.4.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.4.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.4.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.4.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.4.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.40.down_proj.weight": "model-00053-of-00092.safetensors", + 
"model.layers.52.mlp.experts.40.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.40.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.40.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.40.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.40.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.41.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.41.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.41.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.41.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.41.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.41.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.42.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.42.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.42.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.42.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.42.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.42.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.43.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.43.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.43.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.43.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.43.up_proj.weight": 
"model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.43.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.44.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.44.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.44.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.44.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.44.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.44.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.45.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.45.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.45.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.45.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.45.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.45.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.46.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.46.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.46.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.46.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.46.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.46.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.47.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.47.down_proj.weight_scale": "model-00053-of-00092.safetensors", + 
"model.layers.52.mlp.experts.47.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.47.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.47.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.47.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.48.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.48.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.48.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.48.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.48.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.48.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.49.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.49.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.49.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.49.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.49.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.49.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.5.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.5.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.5.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.5.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.5.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.5.up_proj.weight_scale": "model-00053-of-00092.safetensors", 
+ "model.layers.52.mlp.experts.50.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.50.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.50.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.50.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.50.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.50.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.51.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.51.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.51.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.51.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.51.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.51.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.52.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.52.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.52.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.52.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.52.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.52.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.53.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.53.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.53.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.53.gate_proj.weight_scale": 
"model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.53.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.53.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.54.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.54.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.54.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.54.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.54.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.54.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.55.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.55.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.55.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.55.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.55.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.55.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.56.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.56.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.56.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.56.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.56.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.56.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.57.down_proj.weight": "model-00053-of-00092.safetensors", + 
"model.layers.52.mlp.experts.57.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.57.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.57.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.57.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.57.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.58.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.58.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.58.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.58.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.58.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.58.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.59.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.59.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.59.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.59.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.59.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.59.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.6.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.6.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.6.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.6.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.6.up_proj.weight": 
"model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.6.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.60.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.60.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.60.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.60.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.60.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.60.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.61.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.61.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.61.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.61.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.61.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.61.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.62.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.62.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.62.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.62.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.62.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.62.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.63.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.63.down_proj.weight_scale": "model-00053-of-00092.safetensors", + 
"model.layers.52.mlp.experts.63.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.63.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.63.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.63.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.64.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.64.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.64.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.64.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.64.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.64.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.65.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.65.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.65.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.65.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.65.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.65.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.66.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.66.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.66.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.66.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.66.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.66.up_proj.weight_scale": 
"model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.67.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.67.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.67.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.67.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.67.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.67.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.68.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.68.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.68.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.68.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.68.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.68.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.69.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.69.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.69.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.69.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.69.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.69.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.7.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.7.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.7.gate_proj.weight": "model-00053-of-00092.safetensors", + 
"model.layers.52.mlp.experts.7.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.7.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.7.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.70.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.70.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.70.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.70.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.70.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.70.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.71.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.71.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.71.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.71.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.71.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.71.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.72.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.72.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.72.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.72.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.72.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.72.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.73.down_proj.weight": 
"model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.73.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.73.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.73.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.73.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.73.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.74.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.74.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.74.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.74.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.74.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.74.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.75.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.75.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.75.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.75.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.75.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.75.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.76.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.76.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.76.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.76.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + 
"model.layers.52.mlp.experts.76.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.76.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.77.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.77.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.77.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.77.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.77.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.77.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.78.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.78.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.78.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.78.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.78.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.78.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.79.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.79.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.79.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.79.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.79.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.79.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.8.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.8.down_proj.weight_scale": 
"model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.8.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.8.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.8.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.8.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.80.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.80.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.80.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.80.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.80.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.80.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.81.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.81.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.81.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.81.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.81.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.81.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.82.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.82.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.82.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.82.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.82.up_proj.weight": "model-00053-of-00092.safetensors", + 
"model.layers.52.mlp.experts.82.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.83.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.83.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.83.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.83.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.83.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.83.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.84.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.84.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.84.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.84.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.84.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.84.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.85.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.85.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.85.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.85.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.85.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.85.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.86.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.86.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.86.gate_proj.weight": 
"model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.86.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.86.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.86.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.87.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.87.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.87.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.87.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.87.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.87.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.88.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.88.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.88.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.88.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.88.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.88.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.89.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.89.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.89.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.89.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.89.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.89.up_proj.weight_scale": "model-00053-of-00092.safetensors", + 
"model.layers.52.mlp.experts.9.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.9.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.9.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.9.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.9.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.9.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.90.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.90.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.90.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.90.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.90.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.90.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.91.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.91.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.91.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.91.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.91.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.91.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.92.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.92.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.92.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.92.gate_proj.weight_scale": 
"model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.92.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.92.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.93.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.93.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.93.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.93.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.93.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.93.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.94.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.94.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.94.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.94.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.94.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.94.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.95.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.95.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.95.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.95.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.95.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.95.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.96.down_proj.weight": "model-00053-of-00092.safetensors", + 
"model.layers.52.mlp.experts.96.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.96.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.96.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.96.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.96.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.97.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.97.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.97.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.97.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.97.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.97.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.98.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.98.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.98.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.98.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.98.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.98.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.99.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.99.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.99.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.99.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.99.up_proj.weight": 
"model-00053-of-00092.safetensors", + "model.layers.52.mlp.experts.99.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.gate.e_score_correction_bias": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.gate.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.shared_experts.down_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.shared_experts.down_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.shared_experts.gate_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.shared_experts.gate_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.shared_experts.up_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.mlp.shared_experts.up_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.post_attention_layernorm.weight": "model-00053-of-00092.safetensors", + "model.layers.52.self_attn.k_norm.weight": "model-00053-of-00092.safetensors", + "model.layers.52.self_attn.k_proj.bias": "model-00053-of-00092.safetensors", + "model.layers.52.self_attn.k_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.self_attn.k_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.self_attn.o_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.self_attn.o_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.self_attn.q_norm.weight": "model-00053-of-00092.safetensors", + "model.layers.52.self_attn.q_proj.bias": "model-00053-of-00092.safetensors", + "model.layers.52.self_attn.q_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.self_attn.q_proj.weight_scale": "model-00053-of-00092.safetensors", + "model.layers.52.self_attn.v_proj.bias": "model-00053-of-00092.safetensors", + "model.layers.52.self_attn.v_proj.weight": "model-00053-of-00092.safetensors", + "model.layers.52.self_attn.v_proj.weight_scale": 
"model-00053-of-00092.safetensors", + "model.layers.53.input_layernorm.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.0.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.0.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.0.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.0.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.0.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.0.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.1.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.1.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.1.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.1.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.1.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.1.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.10.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.10.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.10.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.10.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.10.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.10.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.100.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.100.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.100.gate_proj.weight": 
"model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.100.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.100.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.100.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.101.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.101.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.101.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.101.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.101.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.101.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.102.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.102.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.102.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.102.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.102.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.102.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.103.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.103.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.103.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.103.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.103.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.103.up_proj.weight_scale": "model-00054-of-00092.safetensors", + 
"model.layers.53.mlp.experts.104.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.104.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.104.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.104.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.104.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.104.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.105.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.105.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.105.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.105.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.105.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.105.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.106.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.106.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.106.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.106.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.106.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.106.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.107.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.107.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.107.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.107.gate_proj.weight_scale": 
"model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.107.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.107.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.108.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.108.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.108.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.108.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.108.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.108.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.109.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.109.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.109.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.109.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.109.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.109.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.11.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.11.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.11.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.11.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.11.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.11.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.110.down_proj.weight": "model-00054-of-00092.safetensors", + 
"model.layers.53.mlp.experts.110.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.110.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.110.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.110.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.110.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.111.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.111.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.111.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.111.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.111.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.111.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.112.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.112.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.112.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.112.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.112.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.112.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.113.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.113.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.113.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.113.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.113.up_proj.weight": 
"model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.113.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.114.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.114.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.114.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.114.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.114.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.114.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.115.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.115.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.115.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.115.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.115.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.115.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.116.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.116.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.116.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.116.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.116.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.116.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.117.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.117.down_proj.weight_scale": "model-00054-of-00092.safetensors", + 
"model.layers.53.mlp.experts.117.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.117.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.117.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.117.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.118.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.118.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.118.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.118.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.118.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.118.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.119.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.119.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.119.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.119.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.119.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.119.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.12.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.12.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.12.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.12.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.12.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.12.up_proj.weight_scale": 
"model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.120.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.120.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.120.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.120.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.120.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.120.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.121.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.121.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.121.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.121.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.121.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.121.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.122.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.122.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.122.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.122.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.122.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.122.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.123.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.123.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.123.gate_proj.weight": "model-00054-of-00092.safetensors", + 
"model.layers.53.mlp.experts.123.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.123.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.123.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.124.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.124.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.124.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.124.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.124.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.124.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.125.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.125.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.125.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.125.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.125.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.125.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.126.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.126.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.126.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.126.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.126.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.126.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.127.down_proj.weight": 
"model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.127.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.127.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.127.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.127.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.127.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.128.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.128.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.128.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.128.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.128.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.128.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.129.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.129.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.129.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.129.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.129.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.129.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.13.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.13.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.13.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.13.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + 
"model.layers.53.mlp.experts.13.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.13.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.130.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.130.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.130.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.130.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.130.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.130.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.131.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.131.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.131.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.131.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.131.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.131.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.132.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.132.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.132.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.132.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.132.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.132.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.133.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.133.down_proj.weight_scale": 
"model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.133.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.133.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.133.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.133.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.134.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.134.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.134.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.134.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.134.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.134.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.135.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.135.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.135.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.135.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.135.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.135.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.136.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.136.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.136.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.136.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.136.up_proj.weight": "model-00054-of-00092.safetensors", + 
"model.layers.53.mlp.experts.136.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.137.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.137.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.137.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.137.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.137.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.137.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.138.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.138.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.138.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.138.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.138.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.138.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.139.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.139.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.139.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.139.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.139.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.139.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.14.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.14.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.14.gate_proj.weight": 
"model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.14.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.14.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.14.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.140.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.140.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.140.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.140.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.140.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.140.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.141.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.141.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.141.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.141.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.141.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.141.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.142.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.142.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.142.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.142.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.142.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.142.up_proj.weight_scale": "model-00054-of-00092.safetensors", + 
"model.layers.53.mlp.experts.143.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.143.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.143.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.143.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.143.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.143.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.144.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.144.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.144.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.144.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.144.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.144.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.145.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.145.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.145.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.145.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.145.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.145.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.146.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.146.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.146.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.146.gate_proj.weight_scale": 
"model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.146.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.146.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.147.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.147.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.147.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.147.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.147.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.147.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.148.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.148.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.148.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.148.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.148.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.148.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.149.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.149.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.149.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.149.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.149.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.149.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.15.down_proj.weight": "model-00054-of-00092.safetensors", + 
"model.layers.53.mlp.experts.15.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.15.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.15.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.15.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.15.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.150.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.150.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.150.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.150.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.150.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.150.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.151.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.151.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.151.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.151.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.151.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.151.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.152.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.152.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.152.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.152.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.152.up_proj.weight": 
"model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.152.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.153.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.153.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.153.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.153.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.153.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.153.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.154.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.154.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.154.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.154.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.154.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.154.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.155.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.155.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.155.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.155.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.155.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.155.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.156.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.156.down_proj.weight_scale": "model-00054-of-00092.safetensors", + 
"model.layers.53.mlp.experts.156.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.156.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.156.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.156.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.157.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.157.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.157.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.157.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.157.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.157.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.158.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.158.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.158.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.158.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.158.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.158.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.159.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.159.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.159.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.159.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.159.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.159.up_proj.weight_scale": 
"model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.16.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.16.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.16.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.16.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.16.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.16.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.17.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.17.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.17.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.17.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.17.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.17.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.18.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.18.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.18.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.18.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.18.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.18.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.19.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.19.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.19.gate_proj.weight": "model-00054-of-00092.safetensors", + 
"model.layers.53.mlp.experts.19.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.19.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.19.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.2.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.2.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.2.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.2.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.2.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.2.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.20.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.20.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.20.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.20.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.20.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.20.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.21.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.21.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.21.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.21.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.21.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.21.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.22.down_proj.weight": "model-00054-of-00092.safetensors", 
+ "model.layers.53.mlp.experts.22.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.22.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.22.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.22.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.22.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.23.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.23.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.23.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.23.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.23.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.23.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.24.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.24.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.24.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.24.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.24.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.24.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.25.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.25.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.25.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.25.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.25.up_proj.weight": 
"model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.25.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.26.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.26.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.26.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.26.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.26.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.26.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.27.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.27.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.27.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.27.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.27.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.27.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.28.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.28.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.28.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.28.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.28.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.28.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.29.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.29.down_proj.weight_scale": "model-00054-of-00092.safetensors", + 
"model.layers.53.mlp.experts.29.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.29.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.29.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.29.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.3.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.3.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.3.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.3.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.3.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.3.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.30.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.30.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.30.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.30.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.30.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.30.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.31.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.31.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.31.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.31.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.31.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.31.up_proj.weight_scale": "model-00054-of-00092.safetensors", 
+ "model.layers.53.mlp.experts.32.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.32.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.32.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.32.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.32.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.32.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.33.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.33.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.33.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.33.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.33.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.33.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.34.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.34.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.34.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.34.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.34.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.34.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.35.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.35.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.35.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.35.gate_proj.weight_scale": 
"model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.35.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.35.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.36.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.36.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.36.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.36.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.36.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.36.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.37.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.37.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.37.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.37.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.37.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.37.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.38.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.38.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.38.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.38.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.38.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.38.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.39.down_proj.weight": "model-00054-of-00092.safetensors", + 
"model.layers.53.mlp.experts.39.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.39.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.39.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.39.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.39.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.4.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.4.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.4.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.4.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.4.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.4.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.40.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.40.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.40.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.40.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.40.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.40.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.41.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.41.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.41.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.41.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.41.up_proj.weight": 
"model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.41.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.42.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.42.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.42.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.42.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.42.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.42.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.43.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.43.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.43.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.43.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.43.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.43.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.44.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.44.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.44.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.44.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.44.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.44.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.45.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.45.down_proj.weight_scale": "model-00054-of-00092.safetensors", + 
"model.layers.53.mlp.experts.45.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.45.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.45.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.45.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.46.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.46.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.46.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.46.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.46.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.46.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.47.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.47.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.47.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.47.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.47.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.47.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.48.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.48.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.48.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.48.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.48.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.48.up_proj.weight_scale": 
"model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.49.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.49.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.49.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.49.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.49.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.49.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.5.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.5.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.5.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.5.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.5.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.5.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.50.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.50.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.50.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.50.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.50.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.50.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.51.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.51.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.51.gate_proj.weight": "model-00054-of-00092.safetensors", + 
"model.layers.53.mlp.experts.51.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.51.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.51.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.52.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.52.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.52.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.52.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.52.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.52.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.53.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.53.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.53.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.53.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.53.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.53.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.54.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.54.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.54.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.54.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.54.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.54.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.55.down_proj.weight": 
"model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.55.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.55.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.55.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.55.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.55.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.56.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.56.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.56.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.56.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.56.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.56.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.57.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.57.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.57.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.57.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.57.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.57.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.58.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.58.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.58.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.58.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + 
"model.layers.53.mlp.experts.58.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.58.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.59.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.59.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.59.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.59.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.59.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.59.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.6.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.6.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.6.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.6.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.6.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.6.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.60.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.60.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.60.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.60.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.60.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.60.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.61.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.61.down_proj.weight_scale": "model-00054-of-00092.safetensors", 
+ "model.layers.53.mlp.experts.61.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.61.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.61.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.61.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.62.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.62.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.62.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.62.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.62.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.62.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.63.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.63.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.63.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.63.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.63.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.63.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.64.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.64.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.64.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.64.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.64.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.64.up_proj.weight_scale": 
"model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.65.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.65.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.65.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.65.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.65.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.65.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.66.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.66.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.66.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.66.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.66.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.66.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.67.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.67.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.67.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.67.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.67.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.67.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.68.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.68.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.68.gate_proj.weight": "model-00054-of-00092.safetensors", + 
"model.layers.53.mlp.experts.68.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.68.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.68.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.69.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.69.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.69.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.69.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.69.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.69.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.7.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.7.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.7.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.7.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.7.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.7.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.70.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.70.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.70.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.70.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.70.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.70.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.71.down_proj.weight": "model-00054-of-00092.safetensors", 
+ "model.layers.53.mlp.experts.71.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.71.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.71.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.71.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.71.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.72.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.72.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.72.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.72.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.72.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.72.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.73.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.73.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.73.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.73.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.73.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.73.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.74.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.74.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.74.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.74.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.74.up_proj.weight": 
"model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.74.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.75.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.75.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.75.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.75.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.75.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.75.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.76.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.76.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.76.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.76.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.76.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.76.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.77.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.77.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.77.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.77.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.77.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.77.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.78.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.78.down_proj.weight_scale": "model-00054-of-00092.safetensors", + 
"model.layers.53.mlp.experts.78.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.78.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.78.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.78.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.79.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.79.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.79.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.79.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.79.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.79.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.8.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.8.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.8.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.8.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.8.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.8.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.80.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.80.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.80.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.80.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.80.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.80.up_proj.weight_scale": "model-00054-of-00092.safetensors", 
+ "model.layers.53.mlp.experts.81.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.81.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.81.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.81.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.81.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.81.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.82.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.82.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.82.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.82.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.82.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.82.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.83.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.83.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.83.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.83.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.83.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.83.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.84.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.84.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.84.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.84.gate_proj.weight_scale": 
"model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.84.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.84.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.85.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.85.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.85.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.85.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.85.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.85.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.86.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.86.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.86.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.86.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.86.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.86.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.87.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.87.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.87.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.87.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.87.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.87.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.88.down_proj.weight": "model-00054-of-00092.safetensors", + 
"model.layers.53.mlp.experts.88.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.88.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.88.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.88.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.88.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.89.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.89.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.89.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.89.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.89.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.89.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.9.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.9.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.9.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.9.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.9.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.9.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.90.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.90.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.90.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.90.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.90.up_proj.weight": 
"model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.90.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.91.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.91.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.91.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.91.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.91.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.91.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.92.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.92.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.92.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.92.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.92.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.92.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.93.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.93.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.93.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.93.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.93.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.93.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.94.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.94.down_proj.weight_scale": "model-00054-of-00092.safetensors", + 
"model.layers.53.mlp.experts.94.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.94.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.94.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.94.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.95.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.95.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.95.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.95.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.95.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.95.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.96.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.96.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.96.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.96.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.96.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.96.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.97.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.97.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.97.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.97.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.97.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.97.up_proj.weight_scale": 
"model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.98.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.98.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.98.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.98.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.98.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.98.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.99.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.99.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.99.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.99.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.99.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.experts.99.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.gate.e_score_correction_bias": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.gate.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.shared_experts.down_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.shared_experts.down_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.shared_experts.gate_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.shared_experts.gate_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.shared_experts.up_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.mlp.shared_experts.up_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.post_attention_layernorm.weight": "model-00054-of-00092.safetensors", + 
"model.layers.53.self_attn.k_norm.weight": "model-00054-of-00092.safetensors", + "model.layers.53.self_attn.k_proj.bias": "model-00054-of-00092.safetensors", + "model.layers.53.self_attn.k_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.self_attn.k_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.self_attn.o_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.self_attn.o_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.self_attn.q_norm.weight": "model-00054-of-00092.safetensors", + "model.layers.53.self_attn.q_proj.bias": "model-00054-of-00092.safetensors", + "model.layers.53.self_attn.q_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.self_attn.q_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.53.self_attn.v_proj.bias": "model-00054-of-00092.safetensors", + "model.layers.53.self_attn.v_proj.weight": "model-00054-of-00092.safetensors", + "model.layers.53.self_attn.v_proj.weight_scale": "model-00054-of-00092.safetensors", + "model.layers.54.input_layernorm.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.0.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.0.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.0.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.0.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.0.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.0.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.1.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.1.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.1.gate_proj.weight": "model-00055-of-00092.safetensors", + 
"model.layers.54.mlp.experts.1.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.1.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.1.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.10.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.10.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.10.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.10.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.10.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.10.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.100.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.100.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.100.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.100.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.100.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.100.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.101.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.101.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.101.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.101.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.101.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.101.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.102.down_proj.weight": 
"model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.102.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.102.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.102.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.102.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.102.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.103.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.103.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.103.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.103.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.103.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.103.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.104.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.104.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.104.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.104.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.104.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.104.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.105.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.105.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.105.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.105.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + 
"model.layers.54.mlp.experts.105.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.105.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.106.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.106.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.106.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.106.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.106.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.106.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.107.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.107.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.107.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.107.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.107.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.107.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.108.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.108.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.108.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.108.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.108.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.108.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.109.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.109.down_proj.weight_scale": 
"model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.109.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.109.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.109.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.109.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.11.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.11.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.11.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.11.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.11.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.11.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.110.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.110.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.110.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.110.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.110.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.110.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.111.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.111.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.111.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.111.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.111.up_proj.weight": "model-00055-of-00092.safetensors", + 
"model.layers.54.mlp.experts.111.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.112.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.112.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.112.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.112.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.112.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.112.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.113.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.113.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.113.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.113.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.113.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.113.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.114.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.114.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.114.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.114.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.114.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.114.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.115.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.115.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.115.gate_proj.weight": 
"model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.115.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.115.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.115.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.116.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.116.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.116.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.116.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.116.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.116.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.117.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.117.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.117.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.117.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.117.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.117.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.118.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.118.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.118.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.118.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.118.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.118.up_proj.weight_scale": "model-00055-of-00092.safetensors", + 
"model.layers.54.mlp.experts.119.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.119.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.119.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.119.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.119.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.119.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.12.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.12.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.12.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.12.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.12.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.12.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.120.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.120.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.120.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.120.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.120.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.120.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.121.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.121.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.121.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.121.gate_proj.weight_scale": 
"model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.121.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.121.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.122.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.122.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.122.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.122.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.122.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.122.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.123.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.123.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.123.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.123.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.123.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.123.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.124.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.124.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.124.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.124.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.124.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.124.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.125.down_proj.weight": "model-00055-of-00092.safetensors", + 
"model.layers.54.mlp.experts.125.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.125.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.125.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.125.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.125.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.126.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.126.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.126.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.126.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.126.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.126.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.127.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.127.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.127.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.127.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.127.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.127.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.128.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.128.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.128.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.128.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.128.up_proj.weight": 
"model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.128.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.129.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.129.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.129.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.129.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.129.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.129.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.13.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.13.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.13.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.13.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.13.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.13.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.130.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.130.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.130.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.130.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.130.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.130.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.131.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.131.down_proj.weight_scale": "model-00055-of-00092.safetensors", + 
"model.layers.54.mlp.experts.131.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.131.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.131.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.131.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.132.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.132.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.132.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.132.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.132.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.132.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.133.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.133.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.133.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.133.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.133.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.133.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.134.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.134.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.134.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.134.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.134.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.134.up_proj.weight_scale": 
"model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.135.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.135.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.135.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.135.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.135.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.135.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.136.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.136.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.136.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.136.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.136.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.136.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.137.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.137.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.137.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.137.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.137.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.137.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.138.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.138.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.138.gate_proj.weight": "model-00055-of-00092.safetensors", + 
"model.layers.54.mlp.experts.138.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.138.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.138.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.139.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.139.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.139.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.139.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.139.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.139.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.14.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.14.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.14.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.14.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.14.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.14.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.140.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.140.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.140.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.140.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.140.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.140.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.141.down_proj.weight": 
"model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.141.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.141.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.141.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.141.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.141.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.142.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.142.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.142.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.142.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.142.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.142.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.143.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.143.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.143.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.143.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.143.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.143.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.144.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.144.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.144.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.144.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + 
"model.layers.54.mlp.experts.144.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.144.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.145.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.145.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.145.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.145.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.145.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.145.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.146.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.146.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.146.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.146.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.146.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.146.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.147.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.147.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.147.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.147.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.147.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.147.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.148.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.148.down_proj.weight_scale": 
"model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.148.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.148.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.148.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.148.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.149.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.149.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.149.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.149.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.149.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.149.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.15.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.15.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.15.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.15.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.15.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.15.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.150.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.150.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.150.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.150.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.150.up_proj.weight": "model-00055-of-00092.safetensors", + 
"model.layers.54.mlp.experts.150.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.151.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.151.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.151.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.151.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.151.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.151.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.152.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.152.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.152.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.152.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.152.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.152.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.153.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.153.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.153.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.153.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.153.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.153.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.154.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.154.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.154.gate_proj.weight": 
"model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.154.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.154.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.154.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.155.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.155.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.155.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.155.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.155.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.155.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.156.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.156.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.156.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.156.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.156.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.156.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.157.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.157.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.157.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.157.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.157.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.157.up_proj.weight_scale": "model-00055-of-00092.safetensors", + 
"model.layers.54.mlp.experts.158.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.158.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.158.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.158.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.158.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.158.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.159.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.159.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.159.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.159.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.159.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.159.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.16.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.16.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.16.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.16.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.16.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.16.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.17.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.17.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.17.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.17.gate_proj.weight_scale": 
"model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.17.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.17.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.18.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.18.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.18.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.18.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.18.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.18.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.19.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.19.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.19.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.19.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.19.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.19.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.2.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.2.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.2.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.2.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.2.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.2.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.20.down_proj.weight": "model-00055-of-00092.safetensors", + 
"model.layers.54.mlp.experts.20.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.20.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.20.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.20.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.20.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.21.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.21.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.21.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.21.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.21.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.21.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.22.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.22.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.22.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.22.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.22.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.22.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.23.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.23.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.23.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.23.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.23.up_proj.weight": 
"model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.23.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.24.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.24.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.24.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.24.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.24.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.24.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.25.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.25.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.25.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.25.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.25.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.25.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.26.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.26.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.26.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.26.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.26.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.26.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.27.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.27.down_proj.weight_scale": "model-00055-of-00092.safetensors", + 
"model.layers.54.mlp.experts.27.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.27.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.27.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.27.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.28.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.28.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.28.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.28.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.28.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.28.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.29.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.29.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.29.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.29.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.29.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.29.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.3.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.3.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.3.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.3.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.3.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.3.up_proj.weight_scale": "model-00055-of-00092.safetensors", 
+ "model.layers.54.mlp.experts.30.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.30.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.30.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.30.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.30.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.30.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.31.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.31.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.31.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.31.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.31.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.31.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.32.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.32.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.32.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.32.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.32.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.32.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.33.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.33.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.33.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.33.gate_proj.weight_scale": 
"model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.33.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.33.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.34.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.34.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.34.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.34.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.34.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.34.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.35.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.35.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.35.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.35.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.35.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.35.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.36.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.36.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.36.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.36.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.36.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.36.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.37.down_proj.weight": "model-00055-of-00092.safetensors", + 
"model.layers.54.mlp.experts.37.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.37.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.37.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.37.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.37.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.38.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.38.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.38.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.38.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.38.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.38.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.39.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.39.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.39.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.39.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.39.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.39.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.4.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.4.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.4.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.4.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.4.up_proj.weight": 
"model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.4.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.40.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.40.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.40.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.40.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.40.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.40.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.41.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.41.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.41.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.41.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.41.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.41.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.42.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.42.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.42.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.42.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.42.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.42.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.43.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.43.down_proj.weight_scale": "model-00055-of-00092.safetensors", + 
"model.layers.54.mlp.experts.43.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.43.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.43.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.43.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.44.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.44.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.44.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.44.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.44.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.44.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.45.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.45.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.45.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.45.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.45.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.45.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.46.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.46.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.46.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.46.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.46.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.46.up_proj.weight_scale": 
"model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.47.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.47.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.47.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.47.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.47.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.47.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.48.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.48.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.48.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.48.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.48.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.48.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.49.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.49.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.49.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.49.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.49.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.49.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.5.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.5.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.5.gate_proj.weight": "model-00055-of-00092.safetensors", + 
"model.layers.54.mlp.experts.5.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.5.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.5.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.50.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.50.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.50.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.50.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.50.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.50.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.51.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.51.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.51.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.51.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.51.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.51.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.52.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.52.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.52.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.52.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.52.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.52.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.53.down_proj.weight": 
"model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.53.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.53.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.53.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.53.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.53.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.54.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.54.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.54.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.54.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.54.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.54.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.55.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.55.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.55.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.55.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.55.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.55.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.56.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.56.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.56.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.56.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + 
"model.layers.54.mlp.experts.56.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.56.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.57.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.57.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.57.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.57.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.57.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.57.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.58.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.58.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.58.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.58.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.58.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.58.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.59.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.59.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.59.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.59.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.59.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.59.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.6.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.6.down_proj.weight_scale": 
"model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.6.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.6.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.6.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.6.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.60.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.60.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.60.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.60.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.60.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.60.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.61.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.61.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.61.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.61.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.61.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.61.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.62.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.62.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.62.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.62.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.62.up_proj.weight": "model-00055-of-00092.safetensors", + 
"model.layers.54.mlp.experts.62.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.63.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.63.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.63.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.63.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.63.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.63.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.64.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.64.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.64.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.64.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.64.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.64.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.65.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.65.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.65.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.65.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.65.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.65.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.66.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.66.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.66.gate_proj.weight": 
"model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.66.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.66.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.66.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.67.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.67.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.67.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.67.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.67.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.67.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.68.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.68.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.68.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.68.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.68.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.68.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.69.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.69.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.69.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.69.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.69.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.69.up_proj.weight_scale": "model-00055-of-00092.safetensors", + 
"model.layers.54.mlp.experts.7.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.7.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.7.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.7.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.7.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.7.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.70.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.70.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.70.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.70.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.70.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.70.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.71.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.71.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.71.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.71.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.71.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.71.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.72.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.72.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.72.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.72.gate_proj.weight_scale": 
"model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.72.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.72.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.73.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.73.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.73.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.73.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.73.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.73.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.74.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.74.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.74.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.74.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.74.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.74.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.75.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.75.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.75.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.75.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.75.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.75.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.76.down_proj.weight": "model-00055-of-00092.safetensors", + 
"model.layers.54.mlp.experts.76.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.76.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.76.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.76.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.76.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.77.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.77.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.77.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.77.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.77.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.77.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.78.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.78.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.78.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.78.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.78.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.78.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.79.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.79.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.79.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.79.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.79.up_proj.weight": 
"model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.79.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.8.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.8.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.8.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.8.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.8.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.8.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.80.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.80.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.80.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.80.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.80.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.80.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.81.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.81.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.81.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.81.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.81.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.81.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.82.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.82.down_proj.weight_scale": "model-00055-of-00092.safetensors", + 
"model.layers.54.mlp.experts.82.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.82.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.82.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.82.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.83.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.83.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.83.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.83.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.83.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.83.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.84.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.84.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.84.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.84.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.84.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.84.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.85.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.85.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.85.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.85.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.85.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.85.up_proj.weight_scale": 
"model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.86.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.86.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.86.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.86.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.86.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.86.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.87.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.87.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.87.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.87.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.87.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.87.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.88.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.88.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.88.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.88.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.88.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.88.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.89.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.89.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.89.gate_proj.weight": "model-00055-of-00092.safetensors", + 
"model.layers.54.mlp.experts.89.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.89.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.89.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.9.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.9.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.9.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.9.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.9.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.9.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.90.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.90.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.90.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.90.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.90.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.90.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.91.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.91.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.91.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.91.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.91.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.91.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.92.down_proj.weight": "model-00055-of-00092.safetensors", 
+ "model.layers.54.mlp.experts.92.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.92.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.92.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.92.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.92.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.93.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.93.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.93.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.93.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.93.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.93.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.94.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.94.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.94.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.94.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.94.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.94.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.95.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.95.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.95.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.95.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.95.up_proj.weight": 
"model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.95.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.96.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.96.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.96.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.96.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.96.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.96.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.97.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.97.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.97.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.97.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.97.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.97.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.98.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.98.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.98.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.98.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.98.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.98.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.99.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.99.down_proj.weight_scale": "model-00055-of-00092.safetensors", + 
"model.layers.54.mlp.experts.99.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.99.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.99.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.experts.99.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.gate.e_score_correction_bias": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.gate.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.shared_experts.down_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.shared_experts.down_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.shared_experts.gate_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.shared_experts.gate_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.shared_experts.up_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.mlp.shared_experts.up_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.post_attention_layernorm.weight": "model-00055-of-00092.safetensors", + "model.layers.54.self_attn.k_norm.weight": "model-00055-of-00092.safetensors", + "model.layers.54.self_attn.k_proj.bias": "model-00055-of-00092.safetensors", + "model.layers.54.self_attn.k_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.self_attn.k_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.self_attn.o_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.self_attn.o_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.54.self_attn.q_norm.weight": "model-00055-of-00092.safetensors", + "model.layers.54.self_attn.q_proj.bias": "model-00055-of-00092.safetensors", + "model.layers.54.self_attn.q_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.self_attn.q_proj.weight_scale": 
"model-00055-of-00092.safetensors", + "model.layers.54.self_attn.v_proj.bias": "model-00055-of-00092.safetensors", + "model.layers.54.self_attn.v_proj.weight": "model-00055-of-00092.safetensors", + "model.layers.54.self_attn.v_proj.weight_scale": "model-00055-of-00092.safetensors", + "model.layers.55.input_layernorm.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.0.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.0.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.0.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.0.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.0.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.0.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.1.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.1.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.1.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.1.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.1.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.1.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.10.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.10.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.10.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.10.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.10.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.10.up_proj.weight_scale": "model-00056-of-00092.safetensors", + 
"model.layers.55.mlp.experts.100.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.100.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.100.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.100.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.100.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.100.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.101.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.101.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.101.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.101.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.101.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.101.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.102.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.102.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.102.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.102.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.102.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.102.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.103.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.103.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.103.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.103.gate_proj.weight_scale": 
"model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.103.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.103.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.104.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.104.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.104.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.104.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.104.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.104.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.105.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.105.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.105.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.105.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.105.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.105.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.106.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.106.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.106.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.106.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.106.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.106.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.107.down_proj.weight": "model-00056-of-00092.safetensors", + 
"model.layers.55.mlp.experts.107.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.107.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.107.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.107.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.107.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.108.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.108.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.108.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.108.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.108.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.108.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.109.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.109.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.109.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.109.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.109.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.109.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.11.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.11.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.11.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.11.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.11.up_proj.weight": 
"model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.11.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.110.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.110.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.110.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.110.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.110.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.110.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.111.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.111.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.111.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.111.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.111.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.111.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.112.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.112.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.112.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.112.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.112.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.112.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.113.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.113.down_proj.weight_scale": "model-00056-of-00092.safetensors", + 
"model.layers.55.mlp.experts.113.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.113.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.113.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.113.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.114.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.114.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.114.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.114.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.114.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.114.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.115.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.115.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.115.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.115.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.115.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.115.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.116.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.116.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.116.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.116.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.116.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.116.up_proj.weight_scale": 
"model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.117.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.117.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.117.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.117.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.117.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.117.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.118.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.118.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.118.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.118.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.118.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.118.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.119.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.119.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.119.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.119.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.119.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.119.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.12.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.12.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.12.gate_proj.weight": "model-00056-of-00092.safetensors", + 
"model.layers.55.mlp.experts.12.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.12.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.12.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.120.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.120.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.120.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.120.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.120.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.120.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.121.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.121.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.121.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.121.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.121.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.121.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.122.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.122.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.122.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.122.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.122.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.122.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.123.down_proj.weight": 
"model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.123.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.123.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.123.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.123.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.123.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.124.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.124.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.124.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.124.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.124.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.124.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.125.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.125.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.125.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.125.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.125.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.125.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.126.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.126.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.126.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.126.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + 
"model.layers.55.mlp.experts.126.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.126.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.127.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.127.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.127.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.127.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.127.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.127.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.128.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.128.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.128.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.128.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.128.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.128.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.129.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.129.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.129.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.129.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.129.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.129.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.13.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.13.down_proj.weight_scale": 
"model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.13.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.13.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.13.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.13.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.130.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.130.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.130.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.130.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.130.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.130.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.131.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.131.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.131.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.131.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.131.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.131.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.132.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.132.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.132.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.132.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.132.up_proj.weight": "model-00056-of-00092.safetensors", + 
"model.layers.55.mlp.experts.132.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.133.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.133.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.133.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.133.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.133.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.133.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.134.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.134.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.134.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.134.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.134.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.134.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.135.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.135.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.135.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.135.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.135.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.135.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.136.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.136.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.136.gate_proj.weight": 
"model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.136.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.136.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.136.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.137.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.137.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.137.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.137.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.137.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.137.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.138.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.138.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.138.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.138.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.138.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.138.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.139.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.139.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.139.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.139.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.139.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.139.up_proj.weight_scale": "model-00056-of-00092.safetensors", + 
"model.layers.55.mlp.experts.14.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.14.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.14.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.14.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.14.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.14.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.140.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.140.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.140.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.140.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.140.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.140.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.141.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.141.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.141.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.141.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.141.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.141.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.142.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.142.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.142.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.142.gate_proj.weight_scale": 
"model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.142.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.142.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.143.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.143.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.143.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.143.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.143.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.143.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.144.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.144.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.144.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.144.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.144.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.144.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.145.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.145.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.145.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.145.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.145.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.145.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.146.down_proj.weight": "model-00056-of-00092.safetensors", + 
"model.layers.55.mlp.experts.146.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.146.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.146.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.146.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.146.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.147.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.147.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.147.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.147.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.147.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.147.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.148.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.148.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.148.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.148.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.148.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.148.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.149.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.149.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.149.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.149.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.149.up_proj.weight": 
"model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.149.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.15.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.15.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.15.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.15.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.15.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.15.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.150.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.150.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.150.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.150.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.150.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.150.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.151.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.151.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.151.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.151.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.151.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.151.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.152.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.152.down_proj.weight_scale": "model-00056-of-00092.safetensors", + 
"model.layers.55.mlp.experts.152.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.152.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.152.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.152.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.153.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.153.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.153.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.153.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.153.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.153.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.154.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.154.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.154.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.154.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.154.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.154.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.155.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.155.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.155.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.155.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.155.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.155.up_proj.weight_scale": 
"model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.156.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.156.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.156.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.156.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.156.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.156.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.157.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.157.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.157.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.157.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.157.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.157.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.158.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.158.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.158.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.158.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.158.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.158.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.159.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.159.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.159.gate_proj.weight": "model-00056-of-00092.safetensors", + 
"model.layers.55.mlp.experts.159.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.159.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.159.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.16.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.16.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.16.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.16.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.16.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.16.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.17.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.17.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.17.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.17.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.17.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.17.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.18.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.18.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.18.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.18.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.18.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.18.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.19.down_proj.weight": 
"model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.19.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.19.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.19.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.19.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.19.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.2.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.2.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.2.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.2.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.2.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.2.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.20.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.20.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.20.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.20.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.20.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.20.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.21.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.21.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.21.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.21.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + 
"model.layers.55.mlp.experts.21.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.21.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.22.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.22.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.22.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.22.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.22.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.22.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.23.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.23.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.23.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.23.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.23.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.23.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.24.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.24.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.24.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.24.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.24.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.24.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.25.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.25.down_proj.weight_scale": 
"model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.25.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.25.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.25.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.25.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.26.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.26.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.26.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.26.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.26.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.26.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.27.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.27.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.27.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.27.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.27.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.27.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.28.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.28.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.28.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.28.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.28.up_proj.weight": "model-00056-of-00092.safetensors", + 
"model.layers.55.mlp.experts.28.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.29.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.29.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.29.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.29.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.29.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.29.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.3.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.3.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.3.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.3.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.3.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.3.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.30.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.30.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.30.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.30.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.30.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.30.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.31.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.31.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.31.gate_proj.weight": 
"model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.31.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.31.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.31.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.32.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.32.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.32.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.32.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.32.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.32.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.33.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.33.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.33.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.33.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.33.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.33.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.34.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.34.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.34.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.34.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.34.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.34.up_proj.weight_scale": "model-00056-of-00092.safetensors", + 
"model.layers.55.mlp.experts.35.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.35.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.35.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.35.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.35.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.35.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.36.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.36.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.36.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.36.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.36.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.36.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.37.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.37.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.37.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.37.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.37.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.37.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.38.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.38.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.38.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.38.gate_proj.weight_scale": 
"model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.38.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.38.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.39.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.39.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.39.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.39.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.39.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.39.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.4.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.4.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.4.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.4.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.4.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.4.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.40.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.40.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.40.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.40.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.40.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.40.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.41.down_proj.weight": "model-00056-of-00092.safetensors", + 
"model.layers.55.mlp.experts.41.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.41.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.41.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.41.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.41.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.42.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.42.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.42.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.42.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.42.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.42.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.43.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.43.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.43.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.43.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.43.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.43.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.44.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.44.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.44.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.44.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.44.up_proj.weight": 
"model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.44.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.45.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.45.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.45.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.45.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.45.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.45.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.46.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.46.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.46.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.46.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.46.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.46.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.47.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.47.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.47.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.47.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.47.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.47.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.48.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.48.down_proj.weight_scale": "model-00056-of-00092.safetensors", + 
"model.layers.55.mlp.experts.48.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.48.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.48.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.48.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.49.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.49.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.49.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.49.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.49.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.49.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.5.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.5.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.5.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.5.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.5.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.5.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.50.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.50.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.50.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.50.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.50.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.50.up_proj.weight_scale": "model-00056-of-00092.safetensors", 
+ "model.layers.55.mlp.experts.51.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.51.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.51.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.51.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.51.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.51.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.52.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.52.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.52.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.52.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.52.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.52.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.53.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.53.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.53.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.53.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.53.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.53.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.54.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.54.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.54.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.54.gate_proj.weight_scale": 
"model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.54.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.54.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.55.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.55.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.55.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.55.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.55.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.55.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.56.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.56.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.56.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.56.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.56.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.56.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.57.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.57.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.57.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.57.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.57.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.57.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.58.down_proj.weight": "model-00056-of-00092.safetensors", + 
"model.layers.55.mlp.experts.58.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.58.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.58.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.58.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.58.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.59.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.59.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.59.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.59.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.59.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.59.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.6.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.6.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.6.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.6.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.6.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.6.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.60.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.60.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.60.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.60.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.60.up_proj.weight": 
"model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.60.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.61.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.61.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.61.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.61.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.61.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.61.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.62.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.62.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.62.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.62.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.62.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.62.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.63.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.63.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.63.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.63.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.63.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.63.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.64.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.64.down_proj.weight_scale": "model-00056-of-00092.safetensors", + 
"model.layers.55.mlp.experts.64.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.64.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.64.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.64.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.65.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.65.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.65.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.65.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.65.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.65.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.66.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.66.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.66.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.66.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.66.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.66.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.67.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.67.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.67.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.67.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.67.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.67.up_proj.weight_scale": 
"model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.68.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.68.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.68.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.68.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.68.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.68.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.69.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.69.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.69.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.69.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.69.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.69.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.7.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.7.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.7.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.7.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.7.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.7.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.70.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.70.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.70.gate_proj.weight": "model-00056-of-00092.safetensors", + 
"model.layers.55.mlp.experts.70.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.70.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.70.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.71.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.71.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.71.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.71.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.71.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.71.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.72.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.72.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.72.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.72.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.72.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.72.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.73.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.73.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.73.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.73.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.73.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.73.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.74.down_proj.weight": 
"model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.74.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.74.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.74.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.74.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.74.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.75.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.75.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.75.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.75.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.75.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.75.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.76.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.76.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.76.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.76.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.76.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.76.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.77.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.77.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.77.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.77.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + 
"model.layers.55.mlp.experts.77.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.77.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.78.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.78.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.78.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.78.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.78.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.78.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.79.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.79.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.79.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.79.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.79.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.79.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.8.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.8.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.8.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.8.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.8.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.8.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.80.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.80.down_proj.weight_scale": "model-00056-of-00092.safetensors", 
+ "model.layers.55.mlp.experts.80.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.80.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.80.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.80.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.81.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.81.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.81.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.81.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.81.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.81.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.82.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.82.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.82.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.82.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.82.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.82.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.83.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.83.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.83.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.83.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.83.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.83.up_proj.weight_scale": 
"model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.84.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.84.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.84.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.84.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.84.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.84.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.85.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.85.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.85.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.85.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.85.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.85.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.86.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.86.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.86.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.86.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.86.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.86.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.87.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.87.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.87.gate_proj.weight": "model-00056-of-00092.safetensors", + 
"model.layers.55.mlp.experts.87.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.87.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.87.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.88.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.88.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.88.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.88.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.88.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.88.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.89.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.89.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.89.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.89.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.89.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.89.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.9.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.9.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.9.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.9.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.9.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.9.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.90.down_proj.weight": "model-00056-of-00092.safetensors", 
+ "model.layers.55.mlp.experts.90.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.90.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.90.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.90.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.90.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.91.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.91.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.91.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.91.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.91.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.91.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.92.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.92.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.92.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.92.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.92.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.92.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.93.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.93.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.93.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.93.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.93.up_proj.weight": 
"model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.93.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.94.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.94.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.94.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.94.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.94.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.94.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.95.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.95.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.95.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.95.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.95.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.95.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.96.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.96.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.96.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.96.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.96.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.96.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.97.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.97.down_proj.weight_scale": "model-00056-of-00092.safetensors", + 
"model.layers.55.mlp.experts.97.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.97.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.97.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.97.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.98.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.98.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.98.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.98.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.98.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.98.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.99.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.99.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.99.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.99.gate_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.99.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.experts.99.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.gate.e_score_correction_bias": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.gate.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.shared_experts.down_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.shared_experts.down_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.shared_experts.gate_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.shared_experts.gate_proj.weight_scale": 
"model-00056-of-00092.safetensors", + "model.layers.55.mlp.shared_experts.up_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.mlp.shared_experts.up_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.post_attention_layernorm.weight": "model-00056-of-00092.safetensors", + "model.layers.55.self_attn.k_norm.weight": "model-00056-of-00092.safetensors", + "model.layers.55.self_attn.k_proj.bias": "model-00056-of-00092.safetensors", + "model.layers.55.self_attn.k_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.self_attn.k_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.self_attn.o_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.self_attn.o_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.self_attn.q_norm.weight": "model-00056-of-00092.safetensors", + "model.layers.55.self_attn.q_proj.bias": "model-00056-of-00092.safetensors", + "model.layers.55.self_attn.q_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.self_attn.q_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.55.self_attn.v_proj.bias": "model-00056-of-00092.safetensors", + "model.layers.55.self_attn.v_proj.weight": "model-00056-of-00092.safetensors", + "model.layers.55.self_attn.v_proj.weight_scale": "model-00056-of-00092.safetensors", + "model.layers.56.input_layernorm.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.0.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.0.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.0.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.0.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.0.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.0.up_proj.weight_scale": 
"model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.1.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.1.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.1.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.1.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.1.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.1.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.10.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.10.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.10.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.10.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.10.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.10.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.100.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.100.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.100.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.100.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.100.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.100.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.101.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.101.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.101.gate_proj.weight": "model-00057-of-00092.safetensors", + 
"model.layers.56.mlp.experts.101.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.101.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.101.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.102.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.102.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.102.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.102.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.102.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.102.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.103.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.103.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.103.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.103.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.103.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.103.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.104.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.104.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.104.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.104.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.104.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.104.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.105.down_proj.weight": 
"model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.105.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.105.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.105.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.105.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.105.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.106.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.106.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.106.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.106.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.106.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.106.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.107.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.107.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.107.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.107.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.107.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.107.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.108.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.108.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.108.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.108.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + 
"model.layers.56.mlp.experts.108.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.108.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.109.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.109.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.109.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.109.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.109.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.109.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.11.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.11.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.11.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.11.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.11.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.11.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.110.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.110.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.110.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.110.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.110.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.110.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.111.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.111.down_proj.weight_scale": 
"model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.111.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.111.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.111.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.111.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.112.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.112.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.112.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.112.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.112.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.112.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.113.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.113.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.113.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.113.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.113.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.113.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.114.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.114.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.114.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.114.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.114.up_proj.weight": "model-00057-of-00092.safetensors", + 
"model.layers.56.mlp.experts.114.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.115.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.115.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.115.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.115.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.115.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.115.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.116.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.116.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.116.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.116.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.116.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.116.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.117.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.117.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.117.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.117.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.117.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.117.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.118.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.118.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.118.gate_proj.weight": 
"model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.118.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.118.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.118.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.119.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.119.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.119.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.119.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.119.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.119.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.12.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.12.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.12.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.12.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.12.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.12.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.120.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.120.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.120.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.120.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.120.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.120.up_proj.weight_scale": "model-00057-of-00092.safetensors", + 
"model.layers.56.mlp.experts.121.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.121.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.121.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.121.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.121.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.121.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.122.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.122.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.122.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.122.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.122.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.122.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.123.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.123.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.123.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.123.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.123.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.123.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.124.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.124.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.124.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.124.gate_proj.weight_scale": 
"model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.124.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.124.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.125.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.125.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.125.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.125.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.125.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.125.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.126.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.126.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.126.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.126.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.126.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.126.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.127.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.127.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.127.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.127.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.127.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.127.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.128.down_proj.weight": "model-00057-of-00092.safetensors", + 
"model.layers.56.mlp.experts.128.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.128.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.128.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.128.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.128.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.129.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.129.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.129.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.129.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.129.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.129.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.13.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.13.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.13.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.13.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.13.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.13.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.130.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.130.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.130.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.130.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.130.up_proj.weight": 
"model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.130.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.131.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.131.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.131.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.131.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.131.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.131.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.132.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.132.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.132.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.132.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.132.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.132.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.133.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.133.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.133.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.133.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.133.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.133.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.134.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.134.down_proj.weight_scale": "model-00057-of-00092.safetensors", + 
"model.layers.56.mlp.experts.134.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.134.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.134.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.134.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.135.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.135.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.135.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.135.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.135.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.135.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.136.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.136.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.136.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.136.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.136.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.136.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.137.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.137.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.137.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.137.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.137.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.137.up_proj.weight_scale": 
"model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.138.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.138.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.138.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.138.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.138.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.138.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.139.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.139.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.139.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.139.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.139.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.139.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.14.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.14.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.14.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.14.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.14.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.14.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.140.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.140.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.140.gate_proj.weight": "model-00057-of-00092.safetensors", + 
"model.layers.56.mlp.experts.140.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.140.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.140.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.141.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.141.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.141.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.141.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.141.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.141.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.142.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.142.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.142.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.142.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.142.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.142.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.143.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.143.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.143.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.143.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.143.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.143.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.144.down_proj.weight": 
"model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.144.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.144.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.144.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.144.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.144.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.145.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.145.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.145.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.145.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.145.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.145.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.146.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.146.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.146.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.146.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.146.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.146.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.147.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.147.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.147.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.147.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + 
"model.layers.56.mlp.experts.147.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.147.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.148.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.148.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.148.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.148.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.148.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.148.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.149.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.149.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.149.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.149.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.149.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.149.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.15.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.15.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.15.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.15.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.15.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.15.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.150.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.150.down_proj.weight_scale": 
"model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.150.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.150.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.150.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.150.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.151.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.151.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.151.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.151.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.151.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.151.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.152.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.152.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.152.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.152.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.152.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.152.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.153.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.153.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.153.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.153.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.153.up_proj.weight": "model-00057-of-00092.safetensors", + 
"model.layers.56.mlp.experts.153.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.154.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.154.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.154.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.154.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.154.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.154.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.155.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.155.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.155.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.155.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.155.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.155.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.156.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.156.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.156.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.156.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.156.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.156.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.157.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.157.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.157.gate_proj.weight": 
"model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.157.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.157.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.157.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.158.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.158.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.158.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.158.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.158.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.158.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.159.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.159.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.159.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.159.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.159.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.159.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.16.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.16.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.16.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.16.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.16.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.16.up_proj.weight_scale": "model-00057-of-00092.safetensors", + 
"model.layers.56.mlp.experts.17.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.17.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.17.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.17.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.17.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.17.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.18.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.18.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.18.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.18.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.18.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.18.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.19.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.19.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.19.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.19.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.19.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.19.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.2.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.2.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.2.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.2.gate_proj.weight_scale": 
"model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.2.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.2.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.20.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.20.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.20.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.20.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.20.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.20.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.21.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.21.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.21.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.21.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.21.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.21.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.22.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.22.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.22.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.22.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.22.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.22.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.23.down_proj.weight": "model-00057-of-00092.safetensors", + 
"model.layers.56.mlp.experts.23.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.23.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.23.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.23.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.23.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.24.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.24.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.24.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.24.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.24.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.24.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.25.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.25.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.25.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.25.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.25.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.25.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.26.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.26.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.26.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.26.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.26.up_proj.weight": 
"model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.26.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.27.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.27.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.27.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.27.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.27.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.27.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.28.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.28.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.28.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.28.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.28.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.28.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.29.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.29.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.29.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.29.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.29.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.29.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.3.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.3.down_proj.weight_scale": "model-00057-of-00092.safetensors", + 
"model.layers.56.mlp.experts.3.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.3.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.3.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.3.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.30.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.30.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.30.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.30.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.30.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.30.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.31.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.31.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.31.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.31.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.31.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.31.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.32.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.32.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.32.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.32.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.32.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.32.up_proj.weight_scale": 
"model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.33.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.33.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.33.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.33.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.33.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.33.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.34.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.34.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.34.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.34.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.34.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.34.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.35.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.35.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.35.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.35.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.35.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.35.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.36.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.36.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.36.gate_proj.weight": "model-00057-of-00092.safetensors", + 
"model.layers.56.mlp.experts.36.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.36.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.36.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.37.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.37.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.37.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.37.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.37.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.37.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.38.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.38.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.38.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.38.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.38.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.38.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.39.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.39.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.39.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.39.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.39.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.39.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.4.down_proj.weight": 
"model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.4.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.4.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.4.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.4.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.4.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.40.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.40.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.40.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.40.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.40.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.40.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.41.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.41.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.41.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.41.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.41.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.41.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.42.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.42.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.42.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.42.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + 
"model.layers.56.mlp.experts.42.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.42.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.43.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.43.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.43.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.43.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.43.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.43.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.44.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.44.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.44.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.44.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.44.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.44.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.45.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.45.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.45.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.45.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.45.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.45.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.46.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.46.down_proj.weight_scale": 
"model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.46.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.46.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.46.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.46.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.47.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.47.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.47.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.47.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.47.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.47.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.48.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.48.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.48.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.48.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.48.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.48.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.49.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.49.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.49.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.49.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.49.up_proj.weight": "model-00057-of-00092.safetensors", + 
"model.layers.56.mlp.experts.49.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.5.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.5.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.5.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.5.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.5.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.5.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.50.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.50.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.50.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.50.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.50.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.50.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.51.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.51.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.51.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.51.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.51.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.51.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.52.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.52.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.52.gate_proj.weight": 
"model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.52.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.52.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.52.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.53.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.53.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.53.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.53.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.53.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.53.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.54.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.54.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.54.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.54.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.54.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.54.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.55.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.55.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.55.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.55.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.55.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.55.up_proj.weight_scale": "model-00057-of-00092.safetensors", + 
"model.layers.56.mlp.experts.56.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.56.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.56.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.56.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.56.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.56.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.57.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.57.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.57.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.57.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.57.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.57.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.58.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.58.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.58.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.58.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.58.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.58.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.59.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.59.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.59.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.59.gate_proj.weight_scale": 
"model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.59.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.59.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.6.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.6.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.6.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.6.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.6.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.6.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.60.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.60.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.60.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.60.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.60.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.60.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.61.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.61.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.61.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.61.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.61.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.61.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.62.down_proj.weight": "model-00057-of-00092.safetensors", + 
"model.layers.56.mlp.experts.62.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.62.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.62.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.62.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.62.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.63.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.63.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.63.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.63.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.63.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.63.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.64.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.64.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.64.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.64.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.64.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.64.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.65.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.65.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.65.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.65.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.65.up_proj.weight": 
"model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.65.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.66.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.66.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.66.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.66.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.66.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.66.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.67.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.67.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.67.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.67.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.67.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.67.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.68.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.68.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.68.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.68.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.68.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.68.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.69.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.69.down_proj.weight_scale": "model-00057-of-00092.safetensors", + 
"model.layers.56.mlp.experts.69.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.69.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.69.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.69.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.7.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.7.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.7.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.7.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.7.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.7.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.70.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.70.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.70.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.70.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.70.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.70.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.71.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.71.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.71.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.71.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.71.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.71.up_proj.weight_scale": "model-00057-of-00092.safetensors", 
+ "model.layers.56.mlp.experts.72.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.72.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.72.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.72.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.72.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.72.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.73.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.73.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.73.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.73.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.73.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.73.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.74.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.74.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.74.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.74.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.74.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.74.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.75.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.75.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.75.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.75.gate_proj.weight_scale": 
"model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.75.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.75.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.76.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.76.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.76.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.76.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.76.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.76.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.77.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.77.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.77.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.77.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.77.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.77.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.78.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.78.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.78.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.78.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.78.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.78.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.79.down_proj.weight": "model-00057-of-00092.safetensors", + 
"model.layers.56.mlp.experts.79.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.79.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.79.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.79.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.79.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.8.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.8.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.8.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.8.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.8.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.8.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.80.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.80.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.80.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.80.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.80.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.80.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.81.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.81.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.81.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.81.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.81.up_proj.weight": 
"model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.81.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.82.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.82.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.82.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.82.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.82.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.82.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.83.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.83.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.83.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.83.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.83.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.83.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.84.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.84.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.84.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.84.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.84.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.84.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.85.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.85.down_proj.weight_scale": "model-00057-of-00092.safetensors", + 
"model.layers.56.mlp.experts.85.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.85.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.85.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.85.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.86.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.86.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.86.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.86.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.86.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.86.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.87.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.87.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.87.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.87.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.87.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.87.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.88.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.88.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.88.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.88.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.88.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.88.up_proj.weight_scale": 
"model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.89.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.89.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.89.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.89.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.89.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.89.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.9.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.9.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.9.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.9.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.9.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.9.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.90.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.90.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.90.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.90.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.90.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.90.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.91.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.91.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.91.gate_proj.weight": "model-00057-of-00092.safetensors", + 
"model.layers.56.mlp.experts.91.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.91.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.91.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.92.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.92.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.92.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.92.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.92.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.92.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.93.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.93.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.93.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.93.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.93.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.93.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.94.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.94.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.94.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.94.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.94.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.94.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.95.down_proj.weight": 
"model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.95.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.95.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.95.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.95.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.95.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.96.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.96.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.96.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.96.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.96.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.96.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.97.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.97.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.97.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.97.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.97.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.97.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.98.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.98.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.98.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.98.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + 
"model.layers.56.mlp.experts.98.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.98.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.99.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.99.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.99.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.99.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.99.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.experts.99.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.gate.e_score_correction_bias": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.gate.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.shared_experts.down_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.shared_experts.down_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.shared_experts.gate_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.shared_experts.gate_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.shared_experts.up_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.mlp.shared_experts.up_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.post_attention_layernorm.weight": "model-00057-of-00092.safetensors", + "model.layers.56.self_attn.k_norm.weight": "model-00057-of-00092.safetensors", + "model.layers.56.self_attn.k_proj.bias": "model-00057-of-00092.safetensors", + "model.layers.56.self_attn.k_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.self_attn.k_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.self_attn.o_proj.weight": "model-00057-of-00092.safetensors", + 
"model.layers.56.self_attn.o_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.self_attn.q_norm.weight": "model-00057-of-00092.safetensors", + "model.layers.56.self_attn.q_proj.bias": "model-00057-of-00092.safetensors", + "model.layers.56.self_attn.q_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.self_attn.q_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.56.self_attn.v_proj.bias": "model-00057-of-00092.safetensors", + "model.layers.56.self_attn.v_proj.weight": "model-00057-of-00092.safetensors", + "model.layers.56.self_attn.v_proj.weight_scale": "model-00057-of-00092.safetensors", + "model.layers.57.input_layernorm.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.0.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.0.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.0.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.0.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.0.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.0.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.1.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.1.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.1.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.1.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.1.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.1.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.10.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.10.down_proj.weight_scale": 
"model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.10.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.10.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.10.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.10.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.100.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.100.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.100.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.100.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.100.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.100.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.101.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.101.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.101.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.101.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.101.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.101.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.102.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.102.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.102.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.102.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.102.up_proj.weight": "model-00058-of-00092.safetensors", + 
"model.layers.57.mlp.experts.102.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.103.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.103.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.103.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.103.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.103.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.103.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.104.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.104.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.104.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.104.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.104.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.104.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.105.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.105.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.105.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.105.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.105.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.105.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.106.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.106.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.106.gate_proj.weight": 
"model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.106.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.106.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.106.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.107.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.107.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.107.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.107.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.107.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.107.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.108.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.108.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.108.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.108.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.108.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.108.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.109.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.109.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.109.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.109.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.109.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.109.up_proj.weight_scale": "model-00058-of-00092.safetensors", + 
"model.layers.57.mlp.experts.11.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.11.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.11.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.11.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.11.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.11.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.110.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.110.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.110.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.110.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.110.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.110.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.111.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.111.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.111.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.111.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.111.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.111.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.112.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.112.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.112.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.112.gate_proj.weight_scale": 
"model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.112.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.112.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.113.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.113.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.113.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.113.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.113.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.113.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.114.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.114.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.114.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.114.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.114.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.114.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.115.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.115.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.115.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.115.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.115.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.115.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.116.down_proj.weight": "model-00058-of-00092.safetensors", + 
"model.layers.57.mlp.experts.116.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.116.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.116.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.116.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.116.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.117.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.117.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.117.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.117.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.117.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.117.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.118.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.118.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.118.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.118.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.118.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.118.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.119.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.119.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.119.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.119.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.119.up_proj.weight": 
"model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.119.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.12.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.12.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.12.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.12.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.12.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.12.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.120.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.120.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.120.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.120.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.120.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.120.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.121.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.121.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.121.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.121.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.121.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.121.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.122.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.122.down_proj.weight_scale": "model-00058-of-00092.safetensors", + 
"model.layers.57.mlp.experts.122.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.122.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.122.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.122.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.123.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.123.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.123.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.123.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.123.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.123.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.124.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.124.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.124.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.124.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.124.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.124.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.125.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.125.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.125.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.125.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.125.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.125.up_proj.weight_scale": 
"model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.126.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.126.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.126.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.126.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.126.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.126.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.127.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.127.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.127.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.127.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.127.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.127.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.128.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.128.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.128.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.128.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.128.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.128.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.129.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.129.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.129.gate_proj.weight": "model-00058-of-00092.safetensors", + 
"model.layers.57.mlp.experts.129.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.129.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.129.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.13.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.13.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.13.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.13.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.13.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.13.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.130.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.130.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.130.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.130.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.130.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.130.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.131.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.131.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.131.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.131.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.131.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.131.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.132.down_proj.weight": 
"model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.132.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.132.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.132.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.132.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.132.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.133.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.133.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.133.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.133.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.133.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.133.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.134.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.134.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.134.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.134.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.134.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.134.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.135.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.135.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.135.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.135.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + 
"model.layers.57.mlp.experts.135.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.135.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.136.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.136.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.136.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.136.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.136.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.136.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.137.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.137.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.137.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.137.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.137.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.137.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.138.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.138.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.138.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.138.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.138.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.138.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.139.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.139.down_proj.weight_scale": 
"model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.139.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.139.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.139.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.139.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.14.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.14.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.14.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.14.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.14.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.14.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.140.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.140.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.140.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.140.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.140.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.140.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.141.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.141.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.141.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.141.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.141.up_proj.weight": "model-00058-of-00092.safetensors", + 
"model.layers.57.mlp.experts.141.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.142.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.142.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.142.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.142.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.142.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.142.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.143.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.143.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.143.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.143.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.143.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.143.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.144.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.144.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.144.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.144.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.144.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.144.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.145.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.145.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.145.gate_proj.weight": 
"model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.145.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.145.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.145.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.146.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.146.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.146.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.146.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.146.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.146.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.147.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.147.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.147.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.147.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.147.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.147.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.148.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.148.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.148.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.148.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.148.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.148.up_proj.weight_scale": "model-00058-of-00092.safetensors", + 
"model.layers.57.mlp.experts.149.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.149.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.149.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.149.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.149.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.149.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.15.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.15.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.15.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.15.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.15.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.15.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.150.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.150.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.150.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.150.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.150.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.150.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.151.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.151.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.151.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.151.gate_proj.weight_scale": 
"model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.151.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.151.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.152.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.152.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.152.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.152.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.152.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.152.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.153.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.153.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.153.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.153.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.153.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.153.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.154.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.154.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.154.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.154.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.154.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.154.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.155.down_proj.weight": "model-00058-of-00092.safetensors", + 
"model.layers.57.mlp.experts.155.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.155.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.155.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.155.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.155.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.156.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.156.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.156.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.156.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.156.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.156.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.157.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.157.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.157.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.157.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.157.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.157.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.158.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.158.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.158.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.158.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.158.up_proj.weight": 
"model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.158.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.159.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.159.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.159.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.159.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.159.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.159.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.16.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.16.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.16.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.16.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.16.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.16.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.17.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.17.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.17.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.17.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.17.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.17.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.18.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.18.down_proj.weight_scale": "model-00058-of-00092.safetensors", + 
"model.layers.57.mlp.experts.18.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.18.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.18.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.18.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.19.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.19.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.19.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.19.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.19.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.19.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.2.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.2.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.2.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.2.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.2.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.2.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.20.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.20.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.20.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.20.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.20.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.20.up_proj.weight_scale": "model-00058-of-00092.safetensors", 
+ "model.layers.57.mlp.experts.21.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.21.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.21.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.21.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.21.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.21.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.22.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.22.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.22.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.22.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.22.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.22.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.23.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.23.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.23.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.23.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.23.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.23.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.24.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.24.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.24.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.24.gate_proj.weight_scale": 
"model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.24.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.24.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.25.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.25.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.25.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.25.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.25.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.25.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.26.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.26.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.26.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.26.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.26.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.26.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.27.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.27.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.27.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.27.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.27.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.27.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.28.down_proj.weight": "model-00058-of-00092.safetensors", + 
"model.layers.57.mlp.experts.28.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.28.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.28.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.28.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.28.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.29.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.29.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.29.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.29.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.29.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.29.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.3.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.3.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.3.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.3.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.3.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.3.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.30.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.30.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.30.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.30.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.30.up_proj.weight": 
"model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.30.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.31.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.31.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.31.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.31.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.31.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.31.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.32.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.32.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.32.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.32.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.32.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.32.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.33.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.33.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.33.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.33.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.33.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.33.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.34.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.34.down_proj.weight_scale": "model-00058-of-00092.safetensors", + 
"model.layers.57.mlp.experts.34.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.34.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.34.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.34.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.35.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.35.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.35.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.35.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.35.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.35.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.36.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.36.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.36.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.36.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.36.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.36.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.37.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.37.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.37.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.37.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.37.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.37.up_proj.weight_scale": 
"model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.38.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.38.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.38.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.38.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.38.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.38.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.39.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.39.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.39.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.39.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.39.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.39.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.4.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.4.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.4.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.4.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.4.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.4.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.40.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.40.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.40.gate_proj.weight": "model-00058-of-00092.safetensors", + 
"model.layers.57.mlp.experts.40.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.40.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.40.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.41.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.41.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.41.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.41.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.41.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.41.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.42.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.42.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.42.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.42.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.42.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.42.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.43.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.43.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.43.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.43.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.43.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.43.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.44.down_proj.weight": 
"model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.44.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.44.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.44.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.44.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.44.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.45.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.45.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.45.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.45.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.45.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.45.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.46.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.46.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.46.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.46.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.46.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.46.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.47.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.47.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.47.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.47.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + 
"model.layers.57.mlp.experts.47.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.47.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.48.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.48.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.48.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.48.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.48.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.48.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.49.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.49.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.49.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.49.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.49.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.49.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.5.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.5.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.5.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.5.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.5.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.5.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.50.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.50.down_proj.weight_scale": "model-00058-of-00092.safetensors", 
+ "model.layers.57.mlp.experts.50.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.50.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.50.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.50.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.51.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.51.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.51.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.51.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.51.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.51.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.52.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.52.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.52.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.52.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.52.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.52.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.53.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.53.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.53.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.53.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.53.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.53.up_proj.weight_scale": 
"model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.54.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.54.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.54.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.54.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.54.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.54.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.55.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.55.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.55.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.55.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.55.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.55.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.56.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.56.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.56.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.56.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.56.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.56.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.57.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.57.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.57.gate_proj.weight": "model-00058-of-00092.safetensors", + 
"model.layers.57.mlp.experts.57.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.57.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.57.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.58.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.58.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.58.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.58.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.58.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.58.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.59.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.59.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.59.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.59.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.59.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.59.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.6.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.6.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.6.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.6.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.6.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.6.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.60.down_proj.weight": "model-00058-of-00092.safetensors", 
+ "model.layers.57.mlp.experts.60.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.60.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.60.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.60.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.60.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.61.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.61.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.61.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.61.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.61.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.61.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.62.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.62.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.62.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.62.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.62.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.62.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.63.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.63.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.63.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.63.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.63.up_proj.weight": 
"model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.63.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.64.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.64.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.64.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.64.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.64.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.64.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.65.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.65.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.65.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.65.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.65.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.65.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.66.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.66.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.66.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.66.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.66.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.66.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.67.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.67.down_proj.weight_scale": "model-00058-of-00092.safetensors", + 
"model.layers.57.mlp.experts.67.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.67.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.67.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.67.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.68.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.68.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.68.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.68.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.68.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.68.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.69.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.69.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.69.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.69.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.69.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.69.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.7.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.7.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.7.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.7.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.7.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.7.up_proj.weight_scale": "model-00058-of-00092.safetensors", 
+ "model.layers.57.mlp.experts.70.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.70.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.70.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.70.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.70.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.70.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.71.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.71.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.71.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.71.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.71.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.71.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.72.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.72.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.72.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.72.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.72.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.72.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.73.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.73.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.73.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.73.gate_proj.weight_scale": 
"model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.73.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.73.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.74.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.74.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.74.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.74.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.74.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.74.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.75.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.75.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.75.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.75.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.75.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.75.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.76.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.76.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.76.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.76.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.76.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.76.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.77.down_proj.weight": "model-00058-of-00092.safetensors", + 
"model.layers.57.mlp.experts.77.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.77.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.77.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.77.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.77.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.78.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.78.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.78.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.78.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.78.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.78.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.79.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.79.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.79.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.79.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.79.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.79.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.8.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.8.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.8.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.8.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.8.up_proj.weight": 
"model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.8.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.80.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.80.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.80.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.80.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.80.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.80.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.81.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.81.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.81.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.81.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.81.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.81.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.82.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.82.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.82.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.82.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.82.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.82.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.83.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.83.down_proj.weight_scale": "model-00058-of-00092.safetensors", + 
"model.layers.57.mlp.experts.83.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.83.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.83.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.83.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.84.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.84.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.84.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.84.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.84.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.84.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.85.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.85.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.85.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.85.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.85.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.85.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.86.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.86.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.86.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.86.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.86.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.86.up_proj.weight_scale": 
"model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.87.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.87.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.87.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.87.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.87.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.87.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.88.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.88.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.88.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.88.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.88.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.88.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.89.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.89.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.89.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.89.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.89.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.89.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.9.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.9.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.9.gate_proj.weight": "model-00058-of-00092.safetensors", + 
"model.layers.57.mlp.experts.9.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.9.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.9.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.90.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.90.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.90.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.90.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.90.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.90.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.91.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.91.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.91.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.91.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.91.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.91.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.92.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.92.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.92.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.92.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.92.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.92.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.93.down_proj.weight": 
"model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.93.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.93.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.93.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.93.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.93.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.94.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.94.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.94.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.94.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.94.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.94.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.95.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.95.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.95.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.95.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.95.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.95.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.96.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.96.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.96.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.96.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + 
"model.layers.57.mlp.experts.96.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.96.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.97.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.97.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.97.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.97.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.97.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.97.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.98.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.98.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.98.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.98.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.98.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.98.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.99.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.99.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.99.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.99.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.99.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.experts.99.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.gate.e_score_correction_bias": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.gate.weight": "model-00058-of-00092.safetensors", + 
"model.layers.57.mlp.shared_experts.down_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.shared_experts.down_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.shared_experts.gate_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.shared_experts.gate_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.shared_experts.up_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.mlp.shared_experts.up_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.post_attention_layernorm.weight": "model-00058-of-00092.safetensors", + "model.layers.57.self_attn.k_norm.weight": "model-00058-of-00092.safetensors", + "model.layers.57.self_attn.k_proj.bias": "model-00058-of-00092.safetensors", + "model.layers.57.self_attn.k_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.self_attn.k_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.self_attn.o_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.self_attn.o_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.self_attn.q_norm.weight": "model-00058-of-00092.safetensors", + "model.layers.57.self_attn.q_proj.bias": "model-00058-of-00092.safetensors", + "model.layers.57.self_attn.q_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.self_attn.q_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.57.self_attn.v_proj.bias": "model-00058-of-00092.safetensors", + "model.layers.57.self_attn.v_proj.weight": "model-00058-of-00092.safetensors", + "model.layers.57.self_attn.v_proj.weight_scale": "model-00058-of-00092.safetensors", + "model.layers.58.input_layernorm.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.0.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.0.down_proj.weight_scale": "model-00059-of-00092.safetensors", + 
"model.layers.58.mlp.experts.0.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.0.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.0.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.0.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.1.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.1.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.1.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.1.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.1.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.1.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.10.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.10.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.10.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.10.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.10.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.10.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.100.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.100.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.100.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.100.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.100.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.100.up_proj.weight_scale": 
"model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.101.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.101.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.101.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.101.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.101.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.101.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.102.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.102.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.102.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.102.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.102.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.102.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.103.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.103.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.103.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.103.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.103.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.103.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.104.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.104.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.104.gate_proj.weight": "model-00059-of-00092.safetensors", + 
"model.layers.58.mlp.experts.104.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.104.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.104.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.105.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.105.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.105.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.105.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.105.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.105.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.106.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.106.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.106.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.106.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.106.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.106.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.107.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.107.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.107.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.107.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.107.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.107.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.108.down_proj.weight": 
"model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.108.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.108.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.108.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.108.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.108.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.109.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.109.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.109.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.109.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.109.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.109.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.11.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.11.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.11.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.11.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.11.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.11.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.110.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.110.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.110.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.110.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + 
"model.layers.58.mlp.experts.110.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.110.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.111.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.111.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.111.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.111.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.111.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.111.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.112.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.112.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.112.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.112.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.112.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.112.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.113.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.113.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.113.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.113.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.113.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.113.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.114.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.114.down_proj.weight_scale": 
"model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.114.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.114.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.114.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.114.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.115.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.115.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.115.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.115.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.115.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.115.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.116.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.116.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.116.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.116.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.116.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.116.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.117.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.117.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.117.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.117.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.117.up_proj.weight": "model-00059-of-00092.safetensors", + 
"model.layers.58.mlp.experts.117.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.118.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.118.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.118.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.118.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.118.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.118.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.119.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.119.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.119.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.119.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.119.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.119.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.12.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.12.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.12.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.12.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.12.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.12.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.120.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.120.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.120.gate_proj.weight": 
"model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.120.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.120.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.120.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.121.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.121.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.121.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.121.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.121.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.121.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.122.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.122.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.122.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.122.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.122.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.122.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.123.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.123.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.123.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.123.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.123.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.123.up_proj.weight_scale": "model-00059-of-00092.safetensors", + 
"model.layers.58.mlp.experts.124.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.124.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.124.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.124.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.124.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.124.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.125.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.125.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.125.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.125.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.125.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.125.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.126.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.126.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.126.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.126.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.126.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.126.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.127.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.127.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.127.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.127.gate_proj.weight_scale": 
"model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.127.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.127.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.128.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.128.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.128.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.128.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.128.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.128.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.129.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.129.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.129.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.129.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.129.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.129.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.13.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.13.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.13.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.13.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.13.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.13.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.130.down_proj.weight": "model-00059-of-00092.safetensors", + 
"model.layers.58.mlp.experts.130.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.130.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.130.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.130.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.130.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.131.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.131.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.131.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.131.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.131.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.131.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.132.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.132.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.132.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.132.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.132.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.132.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.133.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.133.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.133.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.133.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.133.up_proj.weight": 
"model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.133.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.134.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.134.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.134.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.134.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.134.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.134.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.135.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.135.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.135.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.135.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.135.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.135.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.136.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.136.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.136.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.136.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.136.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.136.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.137.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.137.down_proj.weight_scale": "model-00059-of-00092.safetensors", + 
"model.layers.58.mlp.experts.137.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.137.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.137.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.137.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.138.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.138.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.138.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.138.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.138.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.138.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.139.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.139.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.139.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.139.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.139.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.139.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.14.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.14.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.14.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.14.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.14.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.14.up_proj.weight_scale": 
"model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.140.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.140.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.140.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.140.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.140.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.140.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.141.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.141.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.141.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.141.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.141.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.141.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.142.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.142.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.142.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.142.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.142.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.142.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.143.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.143.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.143.gate_proj.weight": "model-00059-of-00092.safetensors", + 
"model.layers.58.mlp.experts.143.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.143.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.143.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.144.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.144.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.144.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.144.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.144.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.144.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.145.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.145.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.145.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.145.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.145.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.145.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.146.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.146.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.146.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.146.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.146.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.146.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.147.down_proj.weight": 
"model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.147.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.147.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.147.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.147.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.147.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.148.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.148.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.148.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.148.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.148.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.148.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.149.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.149.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.149.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.149.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.149.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.149.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.15.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.15.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.15.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.15.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + 
"model.layers.58.mlp.experts.15.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.15.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.150.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.150.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.150.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.150.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.150.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.150.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.151.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.151.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.151.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.151.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.151.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.151.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.152.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.152.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.152.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.152.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.152.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.152.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.153.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.153.down_proj.weight_scale": 
"model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.153.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.153.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.153.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.153.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.154.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.154.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.154.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.154.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.154.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.154.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.155.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.155.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.155.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.155.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.155.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.155.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.156.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.156.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.156.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.156.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.156.up_proj.weight": "model-00059-of-00092.safetensors", + 
"model.layers.58.mlp.experts.156.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.157.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.157.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.157.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.157.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.157.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.157.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.158.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.158.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.158.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.158.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.158.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.158.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.159.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.159.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.159.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.159.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.159.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.159.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.16.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.16.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.16.gate_proj.weight": 
"model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.16.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.16.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.16.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.17.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.17.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.17.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.17.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.17.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.17.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.18.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.18.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.18.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.18.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.18.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.18.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.19.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.19.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.19.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.19.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.19.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.19.up_proj.weight_scale": "model-00059-of-00092.safetensors", + 
"model.layers.58.mlp.experts.2.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.2.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.2.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.2.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.2.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.2.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.20.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.20.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.20.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.20.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.20.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.20.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.21.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.21.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.21.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.21.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.21.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.21.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.22.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.22.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.22.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.22.gate_proj.weight_scale": 
"model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.22.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.22.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.23.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.23.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.23.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.23.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.23.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.23.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.24.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.24.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.24.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.24.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.24.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.24.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.25.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.25.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.25.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.25.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.25.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.25.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.26.down_proj.weight": "model-00059-of-00092.safetensors", + 
"model.layers.58.mlp.experts.26.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.26.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.26.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.26.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.26.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.27.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.27.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.27.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.27.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.27.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.27.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.28.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.28.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.28.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.28.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.28.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.28.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.29.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.29.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.29.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.29.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.29.up_proj.weight": 
"model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.29.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.3.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.3.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.3.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.3.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.3.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.3.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.30.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.30.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.30.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.30.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.30.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.30.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.31.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.31.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.31.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.31.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.31.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.31.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.32.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.32.down_proj.weight_scale": "model-00059-of-00092.safetensors", + 
"model.layers.58.mlp.experts.32.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.32.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.32.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.32.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.33.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.33.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.33.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.33.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.33.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.33.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.34.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.34.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.34.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.34.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.34.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.34.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.35.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.35.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.35.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.35.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.35.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.35.up_proj.weight_scale": 
"model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.36.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.36.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.36.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.36.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.36.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.36.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.37.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.37.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.37.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.37.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.37.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.37.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.38.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.38.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.38.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.38.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.38.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.38.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.39.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.39.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.39.gate_proj.weight": "model-00059-of-00092.safetensors", + 
"model.layers.58.mlp.experts.39.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.39.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.39.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.4.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.4.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.4.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.4.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.4.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.4.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.40.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.40.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.40.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.40.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.40.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.40.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.41.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.41.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.41.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.41.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.41.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.41.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.42.down_proj.weight": "model-00059-of-00092.safetensors", 
+ "model.layers.58.mlp.experts.42.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.42.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.42.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.42.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.42.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.43.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.43.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.43.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.43.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.43.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.43.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.44.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.44.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.44.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.44.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.44.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.44.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.45.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.45.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.45.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.45.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.45.up_proj.weight": 
"model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.45.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.46.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.46.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.46.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.46.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.46.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.46.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.47.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.47.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.47.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.47.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.47.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.47.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.48.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.48.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.48.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.48.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.48.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.48.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.49.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.49.down_proj.weight_scale": "model-00059-of-00092.safetensors", + 
"model.layers.58.mlp.experts.49.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.49.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.49.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.49.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.5.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.5.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.5.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.5.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.5.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.5.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.50.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.50.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.50.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.50.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.50.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.50.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.51.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.51.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.51.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.51.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.51.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.51.up_proj.weight_scale": "model-00059-of-00092.safetensors", 
+ "model.layers.58.mlp.experts.52.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.52.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.52.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.52.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.52.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.52.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.53.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.53.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.53.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.53.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.53.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.53.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.54.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.54.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.54.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.54.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.54.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.54.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.55.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.55.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.55.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.55.gate_proj.weight_scale": 
"model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.55.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.55.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.56.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.56.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.56.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.56.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.56.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.56.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.57.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.57.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.57.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.57.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.57.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.57.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.58.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.58.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.58.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.58.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.58.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.58.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.59.down_proj.weight": "model-00059-of-00092.safetensors", + 
"model.layers.58.mlp.experts.59.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.59.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.59.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.59.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.59.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.6.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.6.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.6.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.6.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.6.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.6.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.60.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.60.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.60.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.60.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.60.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.60.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.61.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.61.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.61.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.61.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.61.up_proj.weight": 
"model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.61.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.62.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.62.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.62.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.62.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.62.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.62.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.63.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.63.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.63.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.63.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.63.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.63.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.64.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.64.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.64.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.64.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.64.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.64.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.65.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.65.down_proj.weight_scale": "model-00059-of-00092.safetensors", + 
"model.layers.58.mlp.experts.65.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.65.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.65.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.65.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.66.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.66.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.66.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.66.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.66.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.66.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.67.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.67.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.67.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.67.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.67.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.67.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.68.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.68.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.68.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.68.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.68.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.68.up_proj.weight_scale": 
"model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.69.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.69.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.69.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.69.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.69.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.69.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.7.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.7.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.7.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.7.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.7.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.7.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.70.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.70.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.70.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.70.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.70.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.70.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.71.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.71.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.71.gate_proj.weight": "model-00059-of-00092.safetensors", + 
"model.layers.58.mlp.experts.71.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.71.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.71.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.72.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.72.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.72.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.72.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.72.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.72.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.73.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.73.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.73.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.73.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.73.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.73.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.74.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.74.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.74.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.74.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.74.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.74.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.75.down_proj.weight": 
"model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.75.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.75.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.75.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.75.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.75.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.76.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.76.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.76.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.76.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.76.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.76.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.77.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.77.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.77.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.77.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.77.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.77.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.78.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.78.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.78.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.78.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + 
"model.layers.58.mlp.experts.78.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.78.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.79.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.79.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.79.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.79.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.79.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.79.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.8.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.8.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.8.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.8.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.8.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.8.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.80.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.80.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.80.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.80.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.80.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.80.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.81.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.81.down_proj.weight_scale": "model-00059-of-00092.safetensors", 
+ "model.layers.58.mlp.experts.81.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.81.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.81.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.81.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.82.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.82.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.82.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.82.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.82.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.82.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.83.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.83.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.83.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.83.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.83.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.83.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.84.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.84.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.84.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.84.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.84.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.84.up_proj.weight_scale": 
"model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.85.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.85.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.85.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.85.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.85.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.85.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.86.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.86.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.86.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.86.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.86.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.86.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.87.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.87.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.87.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.87.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.87.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.87.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.88.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.88.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.88.gate_proj.weight": "model-00059-of-00092.safetensors", + 
"model.layers.58.mlp.experts.88.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.88.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.88.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.89.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.89.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.89.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.89.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.89.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.89.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.9.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.9.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.9.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.9.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.9.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.9.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.90.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.90.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.90.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.90.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.90.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.90.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.91.down_proj.weight": "model-00059-of-00092.safetensors", 
+ "model.layers.58.mlp.experts.91.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.91.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.91.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.91.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.91.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.92.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.92.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.92.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.92.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.92.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.92.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.93.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.93.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.93.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.93.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.93.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.93.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.94.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.94.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.94.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.94.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.94.up_proj.weight": 
"model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.94.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.95.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.95.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.95.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.95.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.95.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.95.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.96.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.96.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.96.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.96.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.96.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.96.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.97.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.97.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.97.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.97.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.97.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.97.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.98.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.98.down_proj.weight_scale": "model-00059-of-00092.safetensors", + 
"model.layers.58.mlp.experts.98.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.98.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.98.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.98.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.99.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.99.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.99.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.99.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.99.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.experts.99.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.gate.e_score_correction_bias": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.gate.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.shared_experts.down_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.shared_experts.down_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.shared_experts.gate_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.shared_experts.gate_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.shared_experts.up_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.mlp.shared_experts.up_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.post_attention_layernorm.weight": "model-00059-of-00092.safetensors", + "model.layers.58.self_attn.k_norm.weight": "model-00059-of-00092.safetensors", + "model.layers.58.self_attn.k_proj.bias": "model-00059-of-00092.safetensors", + "model.layers.58.self_attn.k_proj.weight": "model-00059-of-00092.safetensors", + 
"model.layers.58.self_attn.k_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.self_attn.o_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.self_attn.o_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.self_attn.q_norm.weight": "model-00059-of-00092.safetensors", + "model.layers.58.self_attn.q_proj.bias": "model-00059-of-00092.safetensors", + "model.layers.58.self_attn.q_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.self_attn.q_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.58.self_attn.v_proj.bias": "model-00059-of-00092.safetensors", + "model.layers.58.self_attn.v_proj.weight": "model-00059-of-00092.safetensors", + "model.layers.58.self_attn.v_proj.weight_scale": "model-00059-of-00092.safetensors", + "model.layers.59.input_layernorm.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.0.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.0.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.0.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.0.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.0.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.0.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.1.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.1.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.1.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.1.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.1.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.1.up_proj.weight_scale": "model-00060-of-00092.safetensors", + 
"model.layers.59.mlp.experts.10.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.10.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.10.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.10.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.10.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.10.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.100.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.100.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.100.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.100.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.100.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.100.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.101.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.101.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.101.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.101.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.101.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.101.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.102.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.102.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.102.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.102.gate_proj.weight_scale": 
"model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.102.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.102.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.103.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.103.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.103.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.103.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.103.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.103.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.104.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.104.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.104.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.104.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.104.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.104.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.105.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.105.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.105.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.105.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.105.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.105.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.106.down_proj.weight": "model-00060-of-00092.safetensors", + 
"model.layers.59.mlp.experts.106.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.106.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.106.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.106.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.106.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.107.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.107.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.107.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.107.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.107.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.107.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.108.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.108.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.108.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.108.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.108.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.108.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.109.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.109.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.109.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.109.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.109.up_proj.weight": 
"model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.109.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.11.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.11.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.11.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.11.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.11.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.11.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.110.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.110.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.110.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.110.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.110.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.110.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.111.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.111.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.111.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.111.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.111.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.111.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.112.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.112.down_proj.weight_scale": "model-00060-of-00092.safetensors", + 
"model.layers.59.mlp.experts.112.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.112.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.112.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.112.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.113.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.113.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.113.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.113.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.113.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.113.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.114.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.114.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.114.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.114.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.114.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.114.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.115.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.115.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.115.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.115.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.115.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.115.up_proj.weight_scale": 
"model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.116.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.116.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.116.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.116.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.116.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.116.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.117.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.117.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.117.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.117.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.117.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.117.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.118.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.118.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.118.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.118.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.118.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.118.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.119.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.119.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.119.gate_proj.weight": "model-00060-of-00092.safetensors", + 
"model.layers.59.mlp.experts.119.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.119.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.119.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.12.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.12.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.12.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.12.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.12.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.12.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.120.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.120.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.120.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.120.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.120.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.120.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.121.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.121.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.121.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.121.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.121.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.121.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.122.down_proj.weight": 
"model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.122.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.122.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.122.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.122.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.122.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.123.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.123.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.123.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.123.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.123.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.123.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.124.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.124.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.124.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.124.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.124.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.124.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.125.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.125.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.125.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.125.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + 
"model.layers.59.mlp.experts.125.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.125.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.126.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.126.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.126.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.126.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.126.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.126.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.127.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.127.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.127.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.127.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.127.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.127.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.128.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.128.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.128.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.128.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.128.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.128.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.129.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.129.down_proj.weight_scale": 
"model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.129.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.129.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.129.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.129.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.13.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.13.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.13.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.13.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.13.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.13.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.130.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.130.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.130.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.130.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.130.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.130.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.131.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.131.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.131.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.131.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.131.up_proj.weight": "model-00060-of-00092.safetensors", + 
"model.layers.59.mlp.experts.131.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.132.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.132.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.132.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.132.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.132.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.132.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.133.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.133.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.133.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.133.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.133.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.133.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.134.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.134.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.134.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.134.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.134.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.134.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.135.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.135.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.135.gate_proj.weight": 
"model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.135.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.135.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.135.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.136.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.136.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.136.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.136.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.136.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.136.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.137.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.137.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.137.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.137.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.137.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.137.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.138.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.138.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.138.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.138.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.138.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.138.up_proj.weight_scale": "model-00060-of-00092.safetensors", + 
"model.layers.59.mlp.experts.139.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.139.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.139.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.139.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.139.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.139.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.14.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.14.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.14.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.14.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.14.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.14.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.140.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.140.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.140.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.140.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.140.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.140.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.141.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.141.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.141.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.141.gate_proj.weight_scale": 
"model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.141.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.141.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.142.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.142.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.142.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.142.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.142.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.142.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.143.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.143.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.143.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.143.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.143.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.143.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.144.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.144.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.144.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.144.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.144.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.144.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.145.down_proj.weight": "model-00060-of-00092.safetensors", + 
"model.layers.59.mlp.experts.145.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.145.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.145.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.145.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.145.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.146.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.146.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.146.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.146.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.146.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.146.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.147.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.147.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.147.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.147.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.147.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.147.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.148.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.148.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.148.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.148.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.148.up_proj.weight": 
"model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.148.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.149.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.149.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.149.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.149.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.149.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.149.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.15.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.15.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.15.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.15.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.15.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.15.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.150.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.150.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.150.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.150.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.150.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.150.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.151.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.151.down_proj.weight_scale": "model-00060-of-00092.safetensors", + 
"model.layers.59.mlp.experts.151.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.151.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.151.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.151.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.152.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.152.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.152.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.152.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.152.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.152.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.153.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.153.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.153.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.153.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.153.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.153.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.154.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.154.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.154.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.154.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.154.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.154.up_proj.weight_scale": 
"model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.155.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.155.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.155.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.155.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.155.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.155.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.156.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.156.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.156.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.156.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.156.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.156.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.157.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.157.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.157.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.157.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.157.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.157.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.158.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.158.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.158.gate_proj.weight": "model-00060-of-00092.safetensors", + 
"model.layers.59.mlp.experts.158.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.158.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.158.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.159.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.159.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.159.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.159.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.159.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.159.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.16.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.16.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.16.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.16.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.16.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.16.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.17.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.17.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.17.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.17.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.17.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.17.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.18.down_proj.weight": 
"model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.18.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.18.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.18.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.18.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.18.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.19.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.19.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.19.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.19.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.19.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.19.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.2.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.2.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.2.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.2.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.2.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.2.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.20.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.20.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.20.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.20.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + 
"model.layers.59.mlp.experts.20.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.20.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.21.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.21.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.21.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.21.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.21.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.21.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.22.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.22.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.22.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.22.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.22.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.22.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.23.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.23.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.23.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.23.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.23.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.23.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.24.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.24.down_proj.weight_scale": 
"model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.24.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.24.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.24.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.24.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.25.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.25.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.25.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.25.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.25.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.25.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.26.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.26.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.26.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.26.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.26.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.26.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.27.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.27.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.27.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.27.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.27.up_proj.weight": "model-00060-of-00092.safetensors", + 
"model.layers.59.mlp.experts.27.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.28.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.28.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.28.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.28.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.28.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.28.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.29.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.29.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.29.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.29.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.29.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.29.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.3.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.3.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.3.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.3.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.3.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.3.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.30.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.30.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.30.gate_proj.weight": 
"model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.30.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.30.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.30.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.31.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.31.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.31.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.31.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.31.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.31.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.32.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.32.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.32.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.32.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.32.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.32.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.33.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.33.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.33.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.33.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.33.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.33.up_proj.weight_scale": "model-00060-of-00092.safetensors", + 
"model.layers.59.mlp.experts.34.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.34.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.34.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.34.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.34.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.34.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.35.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.35.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.35.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.35.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.35.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.35.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.36.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.36.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.36.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.36.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.36.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.36.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.37.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.37.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.37.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.37.gate_proj.weight_scale": 
"model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.37.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.37.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.38.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.38.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.38.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.38.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.38.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.38.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.39.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.39.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.39.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.39.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.39.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.39.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.4.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.4.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.4.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.4.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.4.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.4.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.40.down_proj.weight": "model-00060-of-00092.safetensors", + 
"model.layers.59.mlp.experts.40.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.40.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.40.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.40.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.40.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.41.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.41.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.41.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.41.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.41.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.41.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.42.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.42.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.42.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.42.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.42.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.42.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.43.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.43.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.43.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.43.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.43.up_proj.weight": 
"model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.43.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.44.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.44.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.44.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.44.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.44.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.44.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.45.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.45.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.45.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.45.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.45.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.45.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.46.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.46.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.46.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.46.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.46.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.46.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.47.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.47.down_proj.weight_scale": "model-00060-of-00092.safetensors", + 
"model.layers.59.mlp.experts.47.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.47.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.47.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.47.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.48.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.48.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.48.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.48.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.48.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.48.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.49.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.49.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.49.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.49.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.49.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.49.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.5.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.5.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.5.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.5.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.5.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.5.up_proj.weight_scale": "model-00060-of-00092.safetensors", 
+ "model.layers.59.mlp.experts.50.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.50.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.50.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.50.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.50.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.50.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.51.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.51.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.51.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.51.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.51.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.51.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.52.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.52.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.52.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.52.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.52.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.52.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.53.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.53.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.53.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.53.gate_proj.weight_scale": 
"model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.53.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.53.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.54.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.54.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.54.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.54.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.54.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.54.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.55.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.55.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.55.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.55.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.55.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.55.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.56.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.56.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.56.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.56.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.56.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.56.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.57.down_proj.weight": "model-00060-of-00092.safetensors", + 
"model.layers.59.mlp.experts.57.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.57.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.57.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.57.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.57.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.58.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.58.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.58.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.58.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.58.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.58.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.59.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.59.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.59.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.59.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.59.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.59.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.6.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.6.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.6.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.6.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.6.up_proj.weight": 
"model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.6.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.60.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.60.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.60.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.60.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.60.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.60.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.61.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.61.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.61.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.61.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.61.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.61.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.62.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.62.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.62.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.62.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.62.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.62.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.63.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.63.down_proj.weight_scale": "model-00060-of-00092.safetensors", + 
"model.layers.59.mlp.experts.63.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.63.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.63.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.63.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.64.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.64.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.64.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.64.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.64.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.64.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.65.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.65.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.65.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.65.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.65.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.65.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.66.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.66.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.66.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.66.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.66.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.66.up_proj.weight_scale": 
"model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.67.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.67.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.67.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.67.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.67.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.67.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.68.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.68.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.68.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.68.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.68.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.68.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.69.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.69.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.69.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.69.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.69.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.69.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.7.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.7.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.7.gate_proj.weight": "model-00060-of-00092.safetensors", + 
"model.layers.59.mlp.experts.7.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.7.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.7.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.70.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.70.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.70.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.70.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.70.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.70.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.71.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.71.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.71.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.71.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.71.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.71.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.72.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.72.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.72.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.72.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.72.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.72.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.73.down_proj.weight": 
"model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.73.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.73.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.73.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.73.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.73.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.74.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.74.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.74.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.74.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.74.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.74.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.75.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.75.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.75.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.75.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.75.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.75.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.76.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.76.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.76.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.76.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + 
"model.layers.59.mlp.experts.76.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.76.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.77.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.77.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.77.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.77.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.77.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.77.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.78.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.78.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.78.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.78.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.78.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.78.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.79.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.79.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.79.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.79.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.79.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.79.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.8.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.8.down_proj.weight_scale": 
"model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.8.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.8.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.8.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.8.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.80.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.80.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.80.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.80.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.80.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.80.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.81.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.81.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.81.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.81.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.81.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.81.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.82.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.82.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.82.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.82.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.82.up_proj.weight": "model-00060-of-00092.safetensors", + 
"model.layers.59.mlp.experts.82.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.83.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.83.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.83.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.83.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.83.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.83.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.84.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.84.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.84.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.84.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.84.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.84.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.85.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.85.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.85.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.85.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.85.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.85.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.86.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.86.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.86.gate_proj.weight": 
"model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.86.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.86.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.86.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.87.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.87.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.87.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.87.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.87.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.87.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.88.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.88.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.88.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.88.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.88.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.88.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.89.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.89.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.89.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.89.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.89.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.89.up_proj.weight_scale": "model-00060-of-00092.safetensors", + 
"model.layers.59.mlp.experts.9.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.9.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.9.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.9.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.9.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.9.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.90.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.90.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.90.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.90.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.90.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.90.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.91.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.91.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.91.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.91.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.91.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.91.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.92.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.92.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.92.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.92.gate_proj.weight_scale": 
"model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.92.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.92.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.93.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.93.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.93.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.93.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.93.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.93.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.94.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.94.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.94.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.94.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.94.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.94.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.95.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.95.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.95.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.95.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.95.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.95.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.96.down_proj.weight": "model-00060-of-00092.safetensors", + 
"model.layers.59.mlp.experts.96.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.96.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.96.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.96.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.96.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.97.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.97.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.97.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.97.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.97.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.97.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.98.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.98.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.98.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.98.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.98.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.98.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.99.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.99.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.99.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.99.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.99.up_proj.weight": 
"model-00060-of-00092.safetensors", + "model.layers.59.mlp.experts.99.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.gate.e_score_correction_bias": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.gate.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.shared_experts.down_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.shared_experts.down_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.shared_experts.gate_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.shared_experts.gate_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.shared_experts.up_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.mlp.shared_experts.up_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.post_attention_layernorm.weight": "model-00060-of-00092.safetensors", + "model.layers.59.self_attn.k_norm.weight": "model-00060-of-00092.safetensors", + "model.layers.59.self_attn.k_proj.bias": "model-00060-of-00092.safetensors", + "model.layers.59.self_attn.k_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.self_attn.k_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.self_attn.o_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.self_attn.o_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.self_attn.q_norm.weight": "model-00060-of-00092.safetensors", + "model.layers.59.self_attn.q_proj.bias": "model-00060-of-00092.safetensors", + "model.layers.59.self_attn.q_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.self_attn.q_proj.weight_scale": "model-00060-of-00092.safetensors", + "model.layers.59.self_attn.v_proj.bias": "model-00060-of-00092.safetensors", + "model.layers.59.self_attn.v_proj.weight": "model-00060-of-00092.safetensors", + "model.layers.59.self_attn.v_proj.weight_scale": 
"model-00060-of-00092.safetensors", + "model.layers.60.input_layernorm.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.0.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.0.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.0.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.0.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.0.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.0.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.1.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.1.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.1.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.1.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.1.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.1.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.10.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.10.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.10.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.10.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.10.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.10.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.100.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.100.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.100.gate_proj.weight": 
"model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.100.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.100.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.100.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.101.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.101.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.101.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.101.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.101.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.101.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.102.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.102.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.102.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.102.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.102.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.102.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.103.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.103.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.103.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.103.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.103.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.103.up_proj.weight_scale": "model-00061-of-00092.safetensors", + 
"model.layers.60.mlp.experts.104.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.104.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.104.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.104.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.104.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.104.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.105.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.105.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.105.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.105.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.105.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.105.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.106.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.106.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.106.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.106.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.106.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.106.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.107.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.107.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.107.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.107.gate_proj.weight_scale": 
"model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.107.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.107.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.108.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.108.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.108.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.108.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.108.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.108.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.109.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.109.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.109.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.109.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.109.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.109.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.11.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.11.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.11.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.11.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.11.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.11.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.110.down_proj.weight": "model-00061-of-00092.safetensors", + 
"model.layers.60.mlp.experts.110.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.110.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.110.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.110.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.110.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.111.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.111.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.111.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.111.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.111.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.111.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.112.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.112.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.112.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.112.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.112.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.112.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.113.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.113.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.113.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.113.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.113.up_proj.weight": 
"model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.113.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.114.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.114.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.114.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.114.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.114.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.114.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.115.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.115.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.115.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.115.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.115.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.115.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.116.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.116.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.116.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.116.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.116.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.116.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.117.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.117.down_proj.weight_scale": "model-00061-of-00092.safetensors", + 
"model.layers.60.mlp.experts.117.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.117.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.117.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.117.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.118.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.118.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.118.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.118.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.118.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.118.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.119.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.119.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.119.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.119.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.119.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.119.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.12.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.12.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.12.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.12.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.12.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.12.up_proj.weight_scale": 
"model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.120.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.120.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.120.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.120.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.120.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.120.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.121.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.121.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.121.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.121.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.121.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.121.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.122.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.122.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.122.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.122.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.122.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.122.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.123.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.123.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.123.gate_proj.weight": "model-00061-of-00092.safetensors", + 
"model.layers.60.mlp.experts.123.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.123.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.123.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.124.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.124.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.124.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.124.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.124.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.124.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.125.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.125.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.125.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.125.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.125.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.125.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.126.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.126.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.126.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.126.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.126.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.126.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.127.down_proj.weight": 
"model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.127.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.127.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.127.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.127.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.127.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.128.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.128.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.128.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.128.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.128.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.128.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.129.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.129.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.129.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.129.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.129.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.129.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.13.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.13.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.13.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.13.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + 
"model.layers.60.mlp.experts.13.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.13.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.130.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.130.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.130.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.130.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.130.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.130.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.131.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.131.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.131.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.131.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.131.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.131.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.132.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.132.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.132.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.132.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.132.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.132.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.133.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.133.down_proj.weight_scale": 
"model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.133.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.133.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.133.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.133.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.134.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.134.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.134.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.134.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.134.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.134.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.135.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.135.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.135.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.135.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.135.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.135.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.136.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.136.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.136.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.136.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.136.up_proj.weight": "model-00061-of-00092.safetensors", + 
"model.layers.60.mlp.experts.136.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.137.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.137.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.137.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.137.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.137.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.137.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.138.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.138.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.138.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.138.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.138.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.138.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.139.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.139.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.139.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.139.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.139.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.139.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.14.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.14.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.14.gate_proj.weight": 
"model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.14.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.14.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.14.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.140.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.140.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.140.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.140.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.140.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.140.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.141.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.141.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.141.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.141.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.141.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.141.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.142.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.142.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.142.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.142.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.142.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.142.up_proj.weight_scale": "model-00061-of-00092.safetensors", + 
"model.layers.60.mlp.experts.143.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.143.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.143.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.143.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.143.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.143.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.144.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.144.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.144.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.144.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.144.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.144.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.145.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.145.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.145.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.145.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.145.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.145.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.146.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.146.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.146.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.146.gate_proj.weight_scale": 
"model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.146.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.146.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.147.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.147.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.147.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.147.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.147.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.147.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.148.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.148.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.148.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.148.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.148.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.148.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.149.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.149.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.149.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.149.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.149.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.149.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.15.down_proj.weight": "model-00061-of-00092.safetensors", + 
"model.layers.60.mlp.experts.15.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.15.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.15.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.15.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.15.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.150.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.150.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.150.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.150.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.150.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.150.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.151.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.151.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.151.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.151.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.151.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.151.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.152.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.152.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.152.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.152.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.152.up_proj.weight": 
"model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.152.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.153.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.153.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.153.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.153.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.153.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.153.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.154.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.154.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.154.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.154.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.154.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.154.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.155.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.155.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.155.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.155.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.155.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.155.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.156.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.156.down_proj.weight_scale": "model-00061-of-00092.safetensors", + 
"model.layers.60.mlp.experts.156.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.156.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.156.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.156.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.157.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.157.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.157.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.157.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.157.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.157.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.158.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.158.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.158.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.158.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.158.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.158.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.159.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.159.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.159.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.159.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.159.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.159.up_proj.weight_scale": 
"model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.16.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.16.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.16.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.16.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.16.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.16.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.17.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.17.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.17.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.17.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.17.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.17.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.18.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.18.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.18.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.18.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.18.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.18.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.19.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.19.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.19.gate_proj.weight": "model-00061-of-00092.safetensors", + 
"model.layers.60.mlp.experts.19.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.19.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.19.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.2.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.2.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.2.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.2.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.2.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.2.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.20.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.20.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.20.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.20.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.20.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.20.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.21.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.21.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.21.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.21.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.21.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.21.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.22.down_proj.weight": "model-00061-of-00092.safetensors", 
+ "model.layers.60.mlp.experts.22.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.22.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.22.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.22.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.22.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.23.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.23.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.23.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.23.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.23.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.23.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.24.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.24.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.24.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.24.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.24.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.24.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.25.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.25.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.25.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.25.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.25.up_proj.weight": 
"model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.25.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.26.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.26.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.26.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.26.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.26.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.26.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.27.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.27.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.27.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.27.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.27.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.27.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.28.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.28.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.28.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.28.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.28.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.28.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.29.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.29.down_proj.weight_scale": "model-00061-of-00092.safetensors", + 
"model.layers.60.mlp.experts.29.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.29.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.29.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.29.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.3.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.3.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.3.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.3.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.3.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.3.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.30.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.30.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.30.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.30.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.30.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.30.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.31.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.31.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.31.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.31.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.31.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.31.up_proj.weight_scale": "model-00061-of-00092.safetensors", 
+ "model.layers.60.mlp.experts.32.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.32.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.32.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.32.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.32.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.32.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.33.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.33.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.33.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.33.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.33.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.33.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.34.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.34.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.34.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.34.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.34.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.34.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.35.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.35.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.35.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.35.gate_proj.weight_scale": 
"model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.35.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.35.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.36.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.36.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.36.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.36.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.36.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.36.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.37.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.37.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.37.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.37.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.37.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.37.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.38.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.38.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.38.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.38.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.38.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.38.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.39.down_proj.weight": "model-00061-of-00092.safetensors", + 
"model.layers.60.mlp.experts.39.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.39.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.39.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.39.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.39.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.4.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.4.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.4.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.4.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.4.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.4.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.40.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.40.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.40.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.40.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.40.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.40.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.41.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.41.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.41.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.41.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.41.up_proj.weight": 
"model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.41.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.42.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.42.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.42.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.42.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.42.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.42.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.43.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.43.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.43.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.43.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.43.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.43.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.44.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.44.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.44.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.44.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.44.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.44.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.45.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.45.down_proj.weight_scale": "model-00061-of-00092.safetensors", + 
"model.layers.60.mlp.experts.45.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.45.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.45.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.45.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.46.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.46.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.46.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.46.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.46.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.46.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.47.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.47.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.47.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.47.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.47.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.47.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.48.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.48.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.48.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.48.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.48.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.48.up_proj.weight_scale": 
"model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.49.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.49.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.49.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.49.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.49.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.49.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.5.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.5.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.5.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.5.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.5.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.5.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.50.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.50.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.50.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.50.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.50.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.50.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.51.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.51.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.51.gate_proj.weight": "model-00061-of-00092.safetensors", + 
"model.layers.60.mlp.experts.51.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.51.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.51.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.52.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.52.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.52.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.52.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.52.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.52.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.53.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.53.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.53.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.53.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.53.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.53.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.54.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.54.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.54.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.54.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.54.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.54.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.55.down_proj.weight": 
"model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.55.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.55.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.55.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.55.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.55.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.56.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.56.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.56.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.56.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.56.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.56.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.57.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.57.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.57.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.57.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.57.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.57.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.58.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.58.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.58.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.58.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + 
"model.layers.60.mlp.experts.58.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.58.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.59.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.59.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.59.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.59.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.59.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.59.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.6.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.6.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.6.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.6.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.6.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.6.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.60.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.60.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.60.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.60.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.60.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.60.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.61.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.61.down_proj.weight_scale": "model-00061-of-00092.safetensors", 
+ "model.layers.60.mlp.experts.61.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.61.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.61.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.61.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.62.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.62.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.62.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.62.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.62.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.62.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.63.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.63.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.63.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.63.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.63.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.63.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.64.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.64.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.64.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.64.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.64.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.64.up_proj.weight_scale": 
"model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.65.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.65.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.65.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.65.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.65.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.65.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.66.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.66.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.66.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.66.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.66.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.66.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.67.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.67.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.67.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.67.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.67.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.67.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.68.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.68.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.68.gate_proj.weight": "model-00061-of-00092.safetensors", + 
"model.layers.60.mlp.experts.68.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.68.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.68.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.69.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.69.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.69.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.69.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.69.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.69.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.7.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.7.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.7.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.7.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.7.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.7.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.70.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.70.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.70.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.70.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.70.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.70.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.71.down_proj.weight": "model-00061-of-00092.safetensors", 
+ "model.layers.60.mlp.experts.71.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.71.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.71.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.71.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.71.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.72.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.72.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.72.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.72.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.72.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.72.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.73.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.73.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.73.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.73.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.73.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.73.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.74.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.74.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.74.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.74.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.74.up_proj.weight": 
"model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.74.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.75.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.75.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.75.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.75.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.75.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.75.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.76.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.76.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.76.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.76.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.76.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.76.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.77.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.77.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.77.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.77.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.77.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.77.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.78.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.78.down_proj.weight_scale": "model-00061-of-00092.safetensors", + 
"model.layers.60.mlp.experts.78.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.78.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.78.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.78.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.79.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.79.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.79.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.79.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.79.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.79.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.8.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.8.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.8.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.8.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.8.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.8.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.80.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.80.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.80.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.80.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.80.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.80.up_proj.weight_scale": "model-00061-of-00092.safetensors", 
+ "model.layers.60.mlp.experts.81.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.81.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.81.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.81.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.81.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.81.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.82.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.82.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.82.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.82.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.82.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.82.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.83.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.83.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.83.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.83.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.83.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.83.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.84.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.84.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.84.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.84.gate_proj.weight_scale": 
"model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.84.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.84.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.85.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.85.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.85.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.85.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.85.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.85.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.86.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.86.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.86.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.86.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.86.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.86.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.87.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.87.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.87.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.87.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.87.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.87.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.88.down_proj.weight": "model-00061-of-00092.safetensors", + 
"model.layers.60.mlp.experts.88.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.88.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.88.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.88.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.88.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.89.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.89.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.89.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.89.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.89.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.89.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.9.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.9.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.9.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.9.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.9.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.9.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.90.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.90.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.90.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.90.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.90.up_proj.weight": 
"model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.90.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.91.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.91.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.91.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.91.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.91.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.91.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.92.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.92.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.92.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.92.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.92.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.92.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.93.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.93.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.93.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.93.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.93.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.93.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.94.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.94.down_proj.weight_scale": "model-00061-of-00092.safetensors", + 
"model.layers.60.mlp.experts.94.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.94.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.94.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.94.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.95.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.95.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.95.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.95.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.95.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.95.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.96.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.96.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.96.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.96.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.96.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.96.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.97.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.97.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.97.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.97.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.97.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.97.up_proj.weight_scale": 
"model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.98.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.98.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.98.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.98.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.98.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.98.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.99.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.99.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.99.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.99.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.99.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.experts.99.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.gate.e_score_correction_bias": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.gate.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.shared_experts.down_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.shared_experts.down_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.shared_experts.gate_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.shared_experts.gate_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.shared_experts.up_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.mlp.shared_experts.up_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.post_attention_layernorm.weight": "model-00061-of-00092.safetensors", + 
"model.layers.60.self_attn.k_norm.weight": "model-00061-of-00092.safetensors", + "model.layers.60.self_attn.k_proj.bias": "model-00061-of-00092.safetensors", + "model.layers.60.self_attn.k_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.self_attn.k_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.self_attn.o_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.self_attn.o_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.self_attn.q_norm.weight": "model-00061-of-00092.safetensors", + "model.layers.60.self_attn.q_proj.bias": "model-00061-of-00092.safetensors", + "model.layers.60.self_attn.q_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.self_attn.q_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.60.self_attn.v_proj.bias": "model-00061-of-00092.safetensors", + "model.layers.60.self_attn.v_proj.weight": "model-00061-of-00092.safetensors", + "model.layers.60.self_attn.v_proj.weight_scale": "model-00061-of-00092.safetensors", + "model.layers.61.input_layernorm.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.0.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.0.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.0.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.0.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.0.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.0.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.1.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.1.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.1.gate_proj.weight": "model-00062-of-00092.safetensors", + 
"model.layers.61.mlp.experts.1.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.1.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.1.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.10.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.10.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.10.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.10.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.10.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.10.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.100.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.100.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.100.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.100.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.100.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.100.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.101.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.101.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.101.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.101.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.101.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.101.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.102.down_proj.weight": 
"model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.102.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.102.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.102.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.102.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.102.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.103.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.103.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.103.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.103.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.103.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.103.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.104.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.104.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.104.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.104.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.104.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.104.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.105.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.105.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.105.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.105.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + 
"model.layers.61.mlp.experts.105.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.105.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.106.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.106.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.106.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.106.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.106.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.106.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.107.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.107.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.107.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.107.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.107.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.107.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.108.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.108.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.108.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.108.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.108.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.108.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.109.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.109.down_proj.weight_scale": 
"model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.109.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.109.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.109.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.109.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.11.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.11.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.11.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.11.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.11.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.11.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.110.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.110.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.110.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.110.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.110.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.110.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.111.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.111.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.111.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.111.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.111.up_proj.weight": "model-00062-of-00092.safetensors", + 
"model.layers.61.mlp.experts.111.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.112.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.112.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.112.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.112.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.112.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.112.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.113.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.113.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.113.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.113.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.113.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.113.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.114.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.114.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.114.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.114.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.114.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.114.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.115.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.115.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.115.gate_proj.weight": 
"model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.115.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.115.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.115.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.116.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.116.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.116.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.116.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.116.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.116.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.117.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.117.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.117.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.117.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.117.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.117.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.118.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.118.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.118.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.118.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.118.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.118.up_proj.weight_scale": "model-00062-of-00092.safetensors", + 
"model.layers.61.mlp.experts.119.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.119.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.119.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.119.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.119.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.119.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.12.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.12.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.12.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.12.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.12.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.12.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.120.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.120.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.120.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.120.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.120.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.120.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.121.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.121.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.121.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.121.gate_proj.weight_scale": 
"model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.121.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.121.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.122.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.122.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.122.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.122.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.122.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.122.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.123.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.123.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.123.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.123.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.123.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.123.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.124.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.124.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.124.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.124.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.124.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.124.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.125.down_proj.weight": "model-00062-of-00092.safetensors", + 
"model.layers.61.mlp.experts.125.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.125.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.125.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.125.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.125.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.126.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.126.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.126.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.126.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.126.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.126.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.127.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.127.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.127.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.127.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.127.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.127.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.128.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.128.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.128.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.128.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.128.up_proj.weight": 
"model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.128.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.129.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.129.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.129.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.129.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.129.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.129.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.13.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.13.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.13.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.13.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.13.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.13.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.130.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.130.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.130.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.130.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.130.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.130.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.131.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.131.down_proj.weight_scale": "model-00062-of-00092.safetensors", + 
"model.layers.61.mlp.experts.131.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.131.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.131.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.131.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.132.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.132.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.132.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.132.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.132.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.132.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.133.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.133.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.133.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.133.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.133.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.133.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.134.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.134.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.134.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.134.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.134.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.134.up_proj.weight_scale": 
"model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.135.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.135.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.135.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.135.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.135.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.135.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.136.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.136.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.136.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.136.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.136.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.136.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.137.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.137.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.137.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.137.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.137.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.137.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.138.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.138.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.138.gate_proj.weight": "model-00062-of-00092.safetensors", + 
"model.layers.61.mlp.experts.138.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.138.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.138.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.139.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.139.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.139.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.139.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.139.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.139.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.14.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.14.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.14.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.14.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.14.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.14.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.140.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.140.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.140.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.140.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.140.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.140.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.141.down_proj.weight": 
"model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.141.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.141.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.141.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.141.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.141.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.142.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.142.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.142.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.142.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.142.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.142.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.143.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.143.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.143.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.143.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.143.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.143.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.144.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.144.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.144.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.144.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + 
"model.layers.61.mlp.experts.144.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.144.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.145.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.145.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.145.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.145.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.145.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.145.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.146.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.146.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.146.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.146.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.146.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.146.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.147.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.147.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.147.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.147.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.147.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.147.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.148.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.148.down_proj.weight_scale": 
"model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.148.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.148.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.148.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.148.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.149.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.149.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.149.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.149.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.149.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.149.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.15.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.15.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.15.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.15.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.15.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.15.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.150.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.150.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.150.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.150.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.150.up_proj.weight": "model-00062-of-00092.safetensors", + 
"model.layers.61.mlp.experts.150.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.151.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.151.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.151.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.151.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.151.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.151.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.152.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.152.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.152.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.152.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.152.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.152.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.153.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.153.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.153.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.153.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.153.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.153.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.154.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.154.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.154.gate_proj.weight": 
"model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.154.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.154.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.154.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.155.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.155.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.155.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.155.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.155.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.155.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.156.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.156.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.156.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.156.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.156.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.156.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.157.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.157.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.157.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.157.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.157.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.157.up_proj.weight_scale": "model-00062-of-00092.safetensors", + 
"model.layers.61.mlp.experts.158.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.158.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.158.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.158.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.158.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.158.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.159.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.159.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.159.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.159.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.159.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.159.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.16.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.16.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.16.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.16.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.16.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.16.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.17.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.17.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.17.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.17.gate_proj.weight_scale": 
"model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.17.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.17.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.18.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.18.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.18.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.18.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.18.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.18.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.19.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.19.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.19.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.19.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.19.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.19.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.2.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.2.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.2.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.2.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.2.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.2.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.20.down_proj.weight": "model-00062-of-00092.safetensors", + 
"model.layers.61.mlp.experts.20.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.20.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.20.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.20.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.20.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.21.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.21.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.21.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.21.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.21.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.21.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.22.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.22.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.22.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.22.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.22.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.22.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.23.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.23.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.23.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.23.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.23.up_proj.weight": 
"model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.23.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.24.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.24.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.24.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.24.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.24.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.24.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.25.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.25.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.25.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.25.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.25.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.25.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.26.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.26.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.26.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.26.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.26.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.26.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.27.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.27.down_proj.weight_scale": "model-00062-of-00092.safetensors", + 
"model.layers.61.mlp.experts.27.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.27.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.27.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.27.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.28.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.28.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.28.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.28.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.28.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.28.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.29.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.29.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.29.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.29.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.29.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.29.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.3.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.3.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.3.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.3.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.3.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.3.up_proj.weight_scale": "model-00062-of-00092.safetensors", 
+ "model.layers.61.mlp.experts.30.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.30.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.30.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.30.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.30.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.30.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.31.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.31.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.31.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.31.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.31.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.31.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.32.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.32.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.32.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.32.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.32.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.32.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.33.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.33.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.33.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.33.gate_proj.weight_scale": 
"model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.33.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.33.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.34.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.34.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.34.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.34.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.34.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.34.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.35.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.35.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.35.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.35.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.35.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.35.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.36.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.36.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.36.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.36.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.36.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.36.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.37.down_proj.weight": "model-00062-of-00092.safetensors", + 
"model.layers.61.mlp.experts.37.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.37.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.37.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.37.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.37.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.38.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.38.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.38.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.38.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.38.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.38.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.39.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.39.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.39.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.39.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.39.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.39.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.4.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.4.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.4.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.4.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.4.up_proj.weight": 
"model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.4.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.40.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.40.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.40.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.40.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.40.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.40.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.41.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.41.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.41.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.41.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.41.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.41.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.42.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.42.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.42.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.42.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.42.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.42.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.43.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.43.down_proj.weight_scale": "model-00062-of-00092.safetensors", + 
"model.layers.61.mlp.experts.43.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.43.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.43.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.43.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.44.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.44.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.44.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.44.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.44.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.44.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.45.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.45.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.45.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.45.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.45.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.45.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.46.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.46.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.46.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.46.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.46.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.46.up_proj.weight_scale": 
"model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.47.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.47.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.47.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.47.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.47.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.47.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.48.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.48.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.48.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.48.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.48.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.48.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.49.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.49.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.49.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.49.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.49.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.49.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.5.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.5.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.5.gate_proj.weight": "model-00062-of-00092.safetensors", + 
"model.layers.61.mlp.experts.5.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.5.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.5.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.50.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.50.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.50.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.50.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.50.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.50.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.51.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.51.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.51.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.51.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.51.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.51.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.52.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.52.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.52.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.52.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.52.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.52.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.53.down_proj.weight": 
"model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.53.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.53.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.53.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.53.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.53.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.54.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.54.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.54.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.54.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.54.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.54.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.55.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.55.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.55.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.55.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.55.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.55.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.56.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.56.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.56.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.56.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + 
"model.layers.61.mlp.experts.56.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.56.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.57.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.57.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.57.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.57.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.57.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.57.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.58.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.58.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.58.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.58.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.58.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.58.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.59.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.59.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.59.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.59.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.59.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.59.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.6.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.6.down_proj.weight_scale": 
"model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.6.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.6.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.6.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.6.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.60.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.60.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.60.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.60.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.60.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.60.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.61.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.61.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.61.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.61.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.61.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.61.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.62.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.62.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.62.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.62.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.62.up_proj.weight": "model-00062-of-00092.safetensors", + 
"model.layers.61.mlp.experts.62.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.63.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.63.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.63.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.63.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.63.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.63.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.64.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.64.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.64.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.64.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.64.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.64.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.65.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.65.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.65.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.65.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.65.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.65.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.66.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.66.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.66.gate_proj.weight": 
"model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.66.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.66.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.66.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.67.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.67.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.67.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.67.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.67.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.67.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.68.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.68.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.68.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.68.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.68.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.68.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.69.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.69.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.69.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.69.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.69.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.69.up_proj.weight_scale": "model-00062-of-00092.safetensors", + 
"model.layers.61.mlp.experts.7.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.7.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.7.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.7.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.7.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.7.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.70.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.70.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.70.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.70.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.70.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.70.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.71.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.71.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.71.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.71.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.71.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.71.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.72.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.72.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.72.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.72.gate_proj.weight_scale": 
"model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.72.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.72.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.73.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.73.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.73.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.73.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.73.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.73.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.74.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.74.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.74.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.74.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.74.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.74.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.75.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.75.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.75.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.75.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.75.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.75.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.76.down_proj.weight": "model-00062-of-00092.safetensors", + 
"model.layers.61.mlp.experts.76.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.76.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.76.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.76.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.76.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.77.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.77.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.77.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.77.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.77.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.77.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.78.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.78.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.78.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.78.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.78.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.78.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.79.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.79.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.79.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.79.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.79.up_proj.weight": 
"model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.79.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.8.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.8.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.8.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.8.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.8.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.8.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.80.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.80.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.80.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.80.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.80.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.80.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.81.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.81.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.81.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.81.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.81.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.81.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.82.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.82.down_proj.weight_scale": "model-00062-of-00092.safetensors", + 
"model.layers.61.mlp.experts.82.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.82.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.82.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.82.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.83.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.83.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.83.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.83.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.83.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.83.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.84.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.84.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.84.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.84.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.84.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.84.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.85.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.85.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.85.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.85.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.85.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.85.up_proj.weight_scale": 
"model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.86.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.86.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.86.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.86.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.86.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.86.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.87.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.87.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.87.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.87.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.87.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.87.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.88.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.88.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.88.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.88.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.88.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.88.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.89.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.89.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.89.gate_proj.weight": "model-00062-of-00092.safetensors", + 
"model.layers.61.mlp.experts.89.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.89.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.89.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.9.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.9.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.9.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.9.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.9.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.9.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.90.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.90.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.90.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.90.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.90.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.90.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.91.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.91.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.91.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.91.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.91.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.91.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.92.down_proj.weight": "model-00062-of-00092.safetensors", 
+ "model.layers.61.mlp.experts.92.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.92.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.92.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.92.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.92.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.93.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.93.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.93.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.93.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.93.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.93.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.94.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.94.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.94.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.94.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.94.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.94.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.95.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.95.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.95.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.95.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.95.up_proj.weight": 
"model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.95.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.96.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.96.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.96.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.96.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.96.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.96.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.97.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.97.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.97.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.97.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.97.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.97.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.98.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.98.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.98.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.98.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.98.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.98.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.99.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.99.down_proj.weight_scale": "model-00062-of-00092.safetensors", + 
"model.layers.61.mlp.experts.99.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.99.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.99.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.experts.99.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.gate.e_score_correction_bias": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.gate.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.shared_experts.down_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.shared_experts.down_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.shared_experts.gate_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.shared_experts.gate_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.shared_experts.up_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.mlp.shared_experts.up_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.post_attention_layernorm.weight": "model-00062-of-00092.safetensors", + "model.layers.61.self_attn.k_norm.weight": "model-00062-of-00092.safetensors", + "model.layers.61.self_attn.k_proj.bias": "model-00062-of-00092.safetensors", + "model.layers.61.self_attn.k_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.self_attn.k_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.self_attn.o_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.self_attn.o_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.61.self_attn.q_norm.weight": "model-00062-of-00092.safetensors", + "model.layers.61.self_attn.q_proj.bias": "model-00062-of-00092.safetensors", + "model.layers.61.self_attn.q_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.self_attn.q_proj.weight_scale": 
"model-00062-of-00092.safetensors", + "model.layers.61.self_attn.v_proj.bias": "model-00062-of-00092.safetensors", + "model.layers.61.self_attn.v_proj.weight": "model-00062-of-00092.safetensors", + "model.layers.61.self_attn.v_proj.weight_scale": "model-00062-of-00092.safetensors", + "model.layers.62.input_layernorm.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.0.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.0.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.0.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.0.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.0.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.0.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.1.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.1.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.1.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.1.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.1.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.1.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.10.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.10.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.10.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.10.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.10.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.10.up_proj.weight_scale": "model-00063-of-00092.safetensors", + 
"model.layers.62.mlp.experts.100.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.100.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.100.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.100.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.100.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.100.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.101.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.101.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.101.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.101.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.101.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.101.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.102.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.102.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.102.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.102.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.102.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.102.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.103.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.103.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.103.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.103.gate_proj.weight_scale": 
"model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.103.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.103.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.104.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.104.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.104.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.104.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.104.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.104.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.105.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.105.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.105.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.105.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.105.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.105.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.106.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.106.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.106.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.106.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.106.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.106.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.107.down_proj.weight": "model-00063-of-00092.safetensors", + 
"model.layers.62.mlp.experts.107.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.107.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.107.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.107.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.107.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.108.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.108.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.108.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.108.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.108.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.108.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.109.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.109.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.109.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.109.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.109.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.109.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.11.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.11.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.11.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.11.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.11.up_proj.weight": 
"model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.11.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.110.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.110.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.110.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.110.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.110.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.110.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.111.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.111.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.111.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.111.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.111.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.111.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.112.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.112.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.112.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.112.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.112.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.112.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.113.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.113.down_proj.weight_scale": "model-00063-of-00092.safetensors", + 
"model.layers.62.mlp.experts.113.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.113.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.113.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.113.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.114.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.114.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.114.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.114.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.114.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.114.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.115.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.115.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.115.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.115.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.115.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.115.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.116.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.116.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.116.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.116.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.116.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.116.up_proj.weight_scale": 
"model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.117.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.117.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.117.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.117.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.117.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.117.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.118.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.118.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.118.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.118.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.118.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.118.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.119.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.119.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.119.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.119.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.119.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.119.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.12.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.12.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.12.gate_proj.weight": "model-00063-of-00092.safetensors", + 
"model.layers.62.mlp.experts.12.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.12.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.12.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.120.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.120.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.120.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.120.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.120.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.120.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.121.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.121.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.121.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.121.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.121.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.121.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.122.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.122.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.122.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.122.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.122.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.122.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.123.down_proj.weight": 
"model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.123.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.123.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.123.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.123.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.123.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.124.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.124.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.124.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.124.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.124.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.124.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.125.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.125.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.125.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.125.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.125.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.125.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.126.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.126.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.126.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.126.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + 
"model.layers.62.mlp.experts.126.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.126.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.127.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.127.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.127.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.127.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.127.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.127.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.128.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.128.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.128.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.128.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.128.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.128.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.129.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.129.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.129.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.129.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.129.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.129.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.13.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.13.down_proj.weight_scale": 
"model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.13.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.13.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.13.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.13.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.130.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.130.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.130.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.130.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.130.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.130.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.131.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.131.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.131.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.131.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.131.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.131.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.132.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.132.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.132.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.132.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.132.up_proj.weight": "model-00063-of-00092.safetensors", + 
"model.layers.62.mlp.experts.132.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.133.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.133.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.133.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.133.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.133.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.133.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.134.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.134.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.134.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.134.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.134.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.134.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.135.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.135.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.135.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.135.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.135.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.135.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.136.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.136.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.136.gate_proj.weight": 
"model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.136.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.136.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.136.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.137.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.137.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.137.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.137.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.137.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.137.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.138.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.138.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.138.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.138.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.138.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.138.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.139.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.139.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.139.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.139.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.139.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.139.up_proj.weight_scale": "model-00063-of-00092.safetensors", + 
"model.layers.62.mlp.experts.14.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.14.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.14.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.14.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.14.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.14.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.140.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.140.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.140.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.140.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.140.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.140.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.141.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.141.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.141.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.141.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.141.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.141.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.142.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.142.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.142.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.142.gate_proj.weight_scale": 
"model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.142.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.142.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.143.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.143.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.143.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.143.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.143.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.143.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.144.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.144.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.144.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.144.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.144.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.144.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.145.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.145.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.145.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.145.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.145.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.145.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.146.down_proj.weight": "model-00063-of-00092.safetensors", + 
"model.layers.62.mlp.experts.146.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.146.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.146.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.146.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.146.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.147.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.147.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.147.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.147.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.147.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.147.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.148.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.148.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.148.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.148.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.148.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.148.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.149.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.149.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.149.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.149.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.149.up_proj.weight": 
"model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.149.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.15.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.15.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.15.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.15.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.15.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.15.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.150.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.150.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.150.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.150.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.150.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.150.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.151.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.151.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.151.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.151.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.151.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.151.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.152.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.152.down_proj.weight_scale": "model-00063-of-00092.safetensors", + 
"model.layers.62.mlp.experts.152.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.152.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.152.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.152.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.153.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.153.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.153.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.153.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.153.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.153.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.154.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.154.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.154.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.154.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.154.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.154.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.155.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.155.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.155.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.155.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.155.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.155.up_proj.weight_scale": 
"model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.156.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.156.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.156.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.156.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.156.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.156.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.157.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.157.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.157.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.157.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.157.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.157.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.158.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.158.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.158.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.158.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.158.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.158.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.159.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.159.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.159.gate_proj.weight": "model-00063-of-00092.safetensors", + 
"model.layers.62.mlp.experts.159.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.159.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.159.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.16.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.16.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.16.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.16.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.16.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.16.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.17.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.17.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.17.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.17.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.17.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.17.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.18.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.18.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.18.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.18.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.18.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.18.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.19.down_proj.weight": 
"model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.19.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.19.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.19.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.19.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.19.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.2.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.2.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.2.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.2.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.2.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.2.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.20.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.20.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.20.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.20.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.20.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.20.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.21.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.21.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.21.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.21.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + 
"model.layers.62.mlp.experts.21.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.21.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.22.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.22.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.22.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.22.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.22.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.22.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.23.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.23.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.23.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.23.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.23.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.23.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.24.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.24.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.24.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.24.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.24.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.24.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.25.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.25.down_proj.weight_scale": 
"model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.25.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.25.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.25.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.25.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.26.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.26.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.26.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.26.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.26.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.26.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.27.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.27.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.27.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.27.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.27.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.27.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.28.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.28.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.28.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.28.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.28.up_proj.weight": "model-00063-of-00092.safetensors", + 
"model.layers.62.mlp.experts.28.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.29.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.29.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.29.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.29.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.29.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.29.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.3.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.3.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.3.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.3.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.3.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.3.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.30.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.30.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.30.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.30.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.30.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.30.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.31.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.31.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.31.gate_proj.weight": 
"model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.31.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.31.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.31.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.32.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.32.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.32.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.32.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.32.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.32.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.33.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.33.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.33.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.33.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.33.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.33.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.34.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.34.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.34.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.34.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.34.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.34.up_proj.weight_scale": "model-00063-of-00092.safetensors", + 
"model.layers.62.mlp.experts.35.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.35.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.35.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.35.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.35.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.35.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.36.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.36.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.36.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.36.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.36.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.36.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.37.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.37.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.37.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.37.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.37.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.37.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.38.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.38.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.38.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.38.gate_proj.weight_scale": 
"model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.38.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.38.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.39.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.39.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.39.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.39.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.39.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.39.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.4.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.4.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.4.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.4.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.4.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.4.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.40.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.40.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.40.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.40.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.40.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.40.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.41.down_proj.weight": "model-00063-of-00092.safetensors", + 
"model.layers.62.mlp.experts.41.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.41.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.41.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.41.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.41.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.42.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.42.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.42.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.42.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.42.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.42.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.43.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.43.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.43.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.43.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.43.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.43.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.44.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.44.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.44.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.44.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.44.up_proj.weight": 
"model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.44.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.45.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.45.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.45.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.45.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.45.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.45.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.46.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.46.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.46.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.46.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.46.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.46.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.47.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.47.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.47.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.47.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.47.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.47.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.48.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.48.down_proj.weight_scale": "model-00063-of-00092.safetensors", + 
"model.layers.62.mlp.experts.48.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.48.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.48.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.48.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.49.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.49.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.49.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.49.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.49.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.49.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.5.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.5.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.5.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.5.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.5.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.5.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.50.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.50.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.50.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.50.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.50.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.50.up_proj.weight_scale": "model-00063-of-00092.safetensors", 
+ "model.layers.62.mlp.experts.51.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.51.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.51.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.51.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.51.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.51.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.52.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.52.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.52.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.52.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.52.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.52.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.53.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.53.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.53.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.53.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.53.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.53.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.54.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.54.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.54.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.54.gate_proj.weight_scale": 
"model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.54.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.54.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.55.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.55.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.55.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.55.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.55.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.55.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.56.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.56.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.56.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.56.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.56.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.56.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.57.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.57.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.57.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.57.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.57.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.57.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.58.down_proj.weight": "model-00063-of-00092.safetensors", + 
"model.layers.62.mlp.experts.58.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.58.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.58.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.58.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.58.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.59.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.59.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.59.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.59.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.59.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.59.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.6.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.6.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.6.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.6.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.6.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.6.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.60.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.60.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.60.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.60.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.60.up_proj.weight": 
"model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.60.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.61.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.61.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.61.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.61.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.61.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.61.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.62.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.62.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.62.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.62.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.62.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.62.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.63.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.63.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.63.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.63.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.63.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.63.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.64.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.64.down_proj.weight_scale": "model-00063-of-00092.safetensors", + 
"model.layers.62.mlp.experts.64.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.64.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.64.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.64.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.65.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.65.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.65.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.65.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.65.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.65.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.66.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.66.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.66.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.66.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.66.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.66.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.67.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.67.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.67.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.67.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.67.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.67.up_proj.weight_scale": 
"model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.68.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.68.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.68.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.68.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.68.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.68.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.69.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.69.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.69.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.69.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.69.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.69.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.7.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.7.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.7.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.7.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.7.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.7.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.70.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.70.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.70.gate_proj.weight": "model-00063-of-00092.safetensors", + 
"model.layers.62.mlp.experts.70.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.70.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.70.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.71.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.71.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.71.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.71.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.71.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.71.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.72.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.72.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.72.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.72.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.72.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.72.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.73.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.73.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.73.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.73.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.73.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.73.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.74.down_proj.weight": 
"model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.74.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.74.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.74.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.74.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.74.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.75.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.75.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.75.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.75.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.75.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.75.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.76.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.76.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.76.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.76.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.76.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.76.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.77.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.77.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.77.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.77.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + 
"model.layers.62.mlp.experts.77.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.77.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.78.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.78.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.78.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.78.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.78.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.78.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.79.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.79.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.79.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.79.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.79.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.79.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.8.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.8.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.8.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.8.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.8.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.8.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.80.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.80.down_proj.weight_scale": "model-00063-of-00092.safetensors", 
+ "model.layers.62.mlp.experts.80.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.80.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.80.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.80.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.81.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.81.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.81.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.81.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.81.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.81.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.82.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.82.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.82.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.82.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.82.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.82.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.83.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.83.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.83.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.83.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.83.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.83.up_proj.weight_scale": 
"model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.84.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.84.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.84.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.84.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.84.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.84.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.85.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.85.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.85.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.85.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.85.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.85.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.86.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.86.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.86.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.86.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.86.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.86.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.87.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.87.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.87.gate_proj.weight": "model-00063-of-00092.safetensors", + 
"model.layers.62.mlp.experts.87.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.87.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.87.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.88.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.88.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.88.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.88.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.88.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.88.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.89.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.89.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.89.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.89.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.89.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.89.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.9.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.9.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.9.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.9.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.9.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.9.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.90.down_proj.weight": "model-00063-of-00092.safetensors", 
+ "model.layers.62.mlp.experts.90.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.90.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.90.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.90.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.90.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.91.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.91.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.91.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.91.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.91.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.91.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.92.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.92.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.92.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.92.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.92.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.92.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.93.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.93.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.93.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.93.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.93.up_proj.weight": 
"model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.93.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.94.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.94.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.94.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.94.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.94.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.94.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.95.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.95.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.95.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.95.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.95.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.95.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.96.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.96.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.96.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.96.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.96.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.96.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.97.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.97.down_proj.weight_scale": "model-00063-of-00092.safetensors", + 
"model.layers.62.mlp.experts.97.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.97.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.97.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.97.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.98.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.98.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.98.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.98.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.98.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.98.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.99.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.99.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.99.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.99.gate_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.99.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.experts.99.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.gate.e_score_correction_bias": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.gate.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.shared_experts.down_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.shared_experts.down_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.shared_experts.gate_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.shared_experts.gate_proj.weight_scale": 
"model-00063-of-00092.safetensors", + "model.layers.62.mlp.shared_experts.up_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.mlp.shared_experts.up_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.post_attention_layernorm.weight": "model-00063-of-00092.safetensors", + "model.layers.62.self_attn.k_norm.weight": "model-00063-of-00092.safetensors", + "model.layers.62.self_attn.k_proj.bias": "model-00063-of-00092.safetensors", + "model.layers.62.self_attn.k_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.self_attn.k_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.self_attn.o_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.self_attn.o_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.self_attn.q_norm.weight": "model-00063-of-00092.safetensors", + "model.layers.62.self_attn.q_proj.bias": "model-00063-of-00092.safetensors", + "model.layers.62.self_attn.q_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.self_attn.q_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.62.self_attn.v_proj.bias": "model-00063-of-00092.safetensors", + "model.layers.62.self_attn.v_proj.weight": "model-00063-of-00092.safetensors", + "model.layers.62.self_attn.v_proj.weight_scale": "model-00063-of-00092.safetensors", + "model.layers.63.input_layernorm.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.0.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.0.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.0.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.0.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.0.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.0.up_proj.weight_scale": 
"model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.1.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.1.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.1.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.1.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.1.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.1.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.10.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.10.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.10.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.10.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.10.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.10.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.100.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.100.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.100.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.100.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.100.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.100.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.101.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.101.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.101.gate_proj.weight": "model-00064-of-00092.safetensors", + 
"model.layers.63.mlp.experts.101.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.101.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.101.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.102.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.102.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.102.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.102.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.102.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.102.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.103.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.103.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.103.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.103.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.103.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.103.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.104.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.104.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.104.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.104.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.104.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.104.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.105.down_proj.weight": 
"model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.105.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.105.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.105.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.105.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.105.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.106.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.106.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.106.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.106.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.106.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.106.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.107.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.107.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.107.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.107.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.107.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.107.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.108.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.108.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.108.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.108.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + 
"model.layers.63.mlp.experts.108.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.108.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.109.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.109.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.109.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.109.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.109.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.109.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.11.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.11.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.11.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.11.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.11.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.11.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.110.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.110.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.110.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.110.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.110.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.110.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.111.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.111.down_proj.weight_scale": 
"model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.111.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.111.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.111.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.111.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.112.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.112.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.112.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.112.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.112.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.112.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.113.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.113.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.113.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.113.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.113.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.113.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.114.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.114.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.114.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.114.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.114.up_proj.weight": "model-00064-of-00092.safetensors", + 
"model.layers.63.mlp.experts.114.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.115.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.115.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.115.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.115.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.115.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.115.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.116.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.116.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.116.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.116.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.116.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.116.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.117.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.117.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.117.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.117.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.117.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.117.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.118.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.118.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.118.gate_proj.weight": 
"model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.118.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.118.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.118.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.119.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.119.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.119.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.119.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.119.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.119.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.12.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.12.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.12.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.12.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.12.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.12.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.120.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.120.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.120.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.120.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.120.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.120.up_proj.weight_scale": "model-00064-of-00092.safetensors", + 
"model.layers.63.mlp.experts.121.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.121.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.121.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.121.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.121.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.121.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.122.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.122.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.122.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.122.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.122.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.122.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.123.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.123.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.123.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.123.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.123.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.123.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.124.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.124.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.124.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.124.gate_proj.weight_scale": 
"model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.124.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.124.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.125.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.125.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.125.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.125.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.125.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.125.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.126.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.126.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.126.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.126.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.126.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.126.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.127.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.127.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.127.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.127.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.127.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.127.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.128.down_proj.weight": "model-00064-of-00092.safetensors", + 
"model.layers.63.mlp.experts.128.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.128.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.128.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.128.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.128.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.129.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.129.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.129.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.129.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.129.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.129.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.13.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.13.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.13.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.13.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.13.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.13.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.130.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.130.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.130.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.130.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.130.up_proj.weight": 
"model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.130.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.131.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.131.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.131.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.131.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.131.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.131.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.132.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.132.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.132.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.132.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.132.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.132.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.133.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.133.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.133.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.133.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.133.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.133.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.134.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.134.down_proj.weight_scale": "model-00064-of-00092.safetensors", + 
"model.layers.63.mlp.experts.134.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.134.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.134.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.134.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.135.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.135.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.135.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.135.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.135.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.135.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.136.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.136.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.136.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.136.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.136.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.136.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.137.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.137.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.137.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.137.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.137.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.137.up_proj.weight_scale": 
"model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.138.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.138.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.138.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.138.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.138.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.138.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.139.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.139.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.139.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.139.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.139.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.139.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.14.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.14.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.14.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.14.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.14.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.14.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.140.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.140.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.140.gate_proj.weight": "model-00064-of-00092.safetensors", + 
"model.layers.63.mlp.experts.140.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.140.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.140.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.141.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.141.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.141.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.141.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.141.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.141.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.142.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.142.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.142.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.142.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.142.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.142.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.143.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.143.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.143.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.143.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.143.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.143.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.144.down_proj.weight": 
"model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.144.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.144.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.144.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.144.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.144.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.145.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.145.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.145.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.145.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.145.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.145.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.146.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.146.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.146.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.146.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.146.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.146.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.147.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.147.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.147.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.147.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + 
"model.layers.63.mlp.experts.147.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.147.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.148.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.148.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.148.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.148.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.148.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.148.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.149.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.149.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.149.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.149.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.149.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.149.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.15.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.15.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.15.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.15.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.15.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.15.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.150.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.150.down_proj.weight_scale": 
"model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.150.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.150.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.150.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.150.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.151.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.151.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.151.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.151.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.151.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.151.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.152.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.152.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.152.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.152.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.152.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.152.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.153.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.153.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.153.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.153.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.153.up_proj.weight": "model-00064-of-00092.safetensors", + 
"model.layers.63.mlp.experts.153.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.154.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.154.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.154.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.154.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.154.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.154.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.155.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.155.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.155.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.155.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.155.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.155.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.156.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.156.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.156.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.156.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.156.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.156.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.157.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.157.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.157.gate_proj.weight": 
"model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.157.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.157.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.157.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.158.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.158.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.158.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.158.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.158.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.158.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.159.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.159.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.159.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.159.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.159.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.159.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.16.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.16.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.16.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.16.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.16.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.16.up_proj.weight_scale": "model-00064-of-00092.safetensors", + 
"model.layers.63.mlp.experts.17.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.17.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.17.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.17.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.17.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.17.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.18.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.18.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.18.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.18.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.18.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.18.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.19.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.19.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.19.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.19.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.19.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.19.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.2.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.2.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.2.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.2.gate_proj.weight_scale": 
"model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.2.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.2.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.20.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.20.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.20.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.20.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.20.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.20.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.21.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.21.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.21.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.21.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.21.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.21.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.22.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.22.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.22.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.22.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.22.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.22.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.23.down_proj.weight": "model-00064-of-00092.safetensors", + 
"model.layers.63.mlp.experts.23.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.23.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.23.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.23.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.23.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.24.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.24.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.24.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.24.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.24.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.24.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.25.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.25.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.25.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.25.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.25.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.25.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.26.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.26.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.26.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.26.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.26.up_proj.weight": 
"model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.26.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.27.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.27.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.27.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.27.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.27.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.27.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.28.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.28.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.28.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.28.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.28.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.28.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.29.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.29.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.29.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.29.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.29.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.29.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.3.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.3.down_proj.weight_scale": "model-00064-of-00092.safetensors", + 
"model.layers.63.mlp.experts.3.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.3.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.3.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.3.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.30.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.30.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.30.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.30.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.30.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.30.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.31.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.31.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.31.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.31.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.31.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.31.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.32.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.32.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.32.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.32.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.32.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.32.up_proj.weight_scale": 
"model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.33.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.33.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.33.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.33.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.33.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.33.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.34.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.34.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.34.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.34.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.34.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.34.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.35.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.35.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.35.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.35.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.35.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.35.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.36.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.36.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.36.gate_proj.weight": "model-00064-of-00092.safetensors", + 
"model.layers.63.mlp.experts.36.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.36.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.36.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.37.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.37.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.37.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.37.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.37.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.37.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.38.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.38.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.38.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.38.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.38.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.38.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.39.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.39.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.39.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.39.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.39.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.39.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.4.down_proj.weight": 
"model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.4.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.4.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.4.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.4.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.4.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.40.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.40.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.40.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.40.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.40.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.40.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.41.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.41.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.41.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.41.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.41.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.41.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.42.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.42.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.42.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.42.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + 
"model.layers.63.mlp.experts.42.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.42.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.43.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.43.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.43.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.43.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.43.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.43.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.44.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.44.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.44.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.44.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.44.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.44.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.45.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.45.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.45.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.45.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.45.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.45.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.46.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.46.down_proj.weight_scale": 
"model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.46.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.46.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.46.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.46.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.47.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.47.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.47.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.47.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.47.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.47.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.48.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.48.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.48.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.48.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.48.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.48.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.49.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.49.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.49.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.49.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.49.up_proj.weight": "model-00064-of-00092.safetensors", + 
"model.layers.63.mlp.experts.49.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.5.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.5.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.5.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.5.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.5.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.5.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.50.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.50.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.50.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.50.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.50.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.50.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.51.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.51.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.51.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.51.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.51.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.51.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.52.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.52.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.52.gate_proj.weight": 
"model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.52.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.52.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.52.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.53.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.53.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.53.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.53.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.53.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.53.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.54.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.54.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.54.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.54.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.54.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.54.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.55.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.55.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.55.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.55.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.55.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.55.up_proj.weight_scale": "model-00064-of-00092.safetensors", + 
"model.layers.63.mlp.experts.56.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.56.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.56.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.56.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.56.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.56.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.57.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.57.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.57.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.57.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.57.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.57.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.58.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.58.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.58.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.58.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.58.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.58.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.59.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.59.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.59.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.59.gate_proj.weight_scale": 
"model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.59.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.59.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.6.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.6.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.6.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.6.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.6.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.6.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.60.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.60.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.60.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.60.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.60.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.60.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.61.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.61.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.61.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.61.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.61.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.61.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.62.down_proj.weight": "model-00064-of-00092.safetensors", + 
"model.layers.63.mlp.experts.62.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.62.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.62.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.62.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.62.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.63.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.63.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.63.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.63.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.63.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.63.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.64.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.64.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.64.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.64.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.64.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.64.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.65.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.65.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.65.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.65.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.65.up_proj.weight": 
"model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.65.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.66.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.66.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.66.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.66.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.66.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.66.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.67.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.67.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.67.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.67.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.67.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.67.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.68.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.68.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.68.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.68.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.68.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.68.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.69.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.69.down_proj.weight_scale": "model-00064-of-00092.safetensors", + 
"model.layers.63.mlp.experts.69.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.69.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.69.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.69.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.7.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.7.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.7.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.7.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.7.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.7.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.70.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.70.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.70.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.70.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.70.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.70.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.71.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.71.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.71.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.71.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.71.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.71.up_proj.weight_scale": "model-00064-of-00092.safetensors", 
+ "model.layers.63.mlp.experts.72.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.72.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.72.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.72.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.72.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.72.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.73.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.73.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.73.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.73.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.73.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.73.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.74.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.74.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.74.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.74.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.74.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.74.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.75.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.75.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.75.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.75.gate_proj.weight_scale": 
"model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.75.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.75.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.76.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.76.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.76.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.76.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.76.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.76.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.77.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.77.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.77.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.77.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.77.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.77.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.78.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.78.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.78.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.78.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.78.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.78.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.79.down_proj.weight": "model-00064-of-00092.safetensors", + 
"model.layers.63.mlp.experts.79.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.79.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.79.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.79.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.79.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.8.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.8.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.8.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.8.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.8.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.8.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.80.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.80.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.80.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.80.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.80.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.80.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.81.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.81.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.81.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.81.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.81.up_proj.weight": 
"model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.81.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.82.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.82.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.82.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.82.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.82.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.82.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.83.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.83.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.83.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.83.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.83.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.83.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.84.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.84.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.84.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.84.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.84.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.84.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.85.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.85.down_proj.weight_scale": "model-00064-of-00092.safetensors", + 
"model.layers.63.mlp.experts.85.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.85.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.85.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.85.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.86.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.86.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.86.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.86.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.86.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.86.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.87.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.87.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.87.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.87.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.87.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.87.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.88.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.88.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.88.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.88.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.88.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.88.up_proj.weight_scale": 
"model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.89.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.89.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.89.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.89.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.89.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.89.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.9.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.9.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.9.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.9.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.9.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.9.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.90.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.90.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.90.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.90.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.90.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.90.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.91.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.91.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.91.gate_proj.weight": "model-00064-of-00092.safetensors", + 
"model.layers.63.mlp.experts.91.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.91.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.91.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.92.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.92.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.92.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.92.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.92.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.92.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.93.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.93.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.93.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.93.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.93.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.93.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.94.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.94.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.94.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.94.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.94.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.94.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.95.down_proj.weight": 
"model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.95.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.95.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.95.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.95.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.95.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.96.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.96.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.96.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.96.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.96.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.96.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.97.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.97.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.97.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.97.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.97.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.97.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.98.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.98.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.98.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.98.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + 
"model.layers.63.mlp.experts.98.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.98.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.99.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.99.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.99.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.99.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.99.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.experts.99.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.gate.e_score_correction_bias": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.gate.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.shared_experts.down_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.shared_experts.down_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.shared_experts.gate_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.shared_experts.gate_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.shared_experts.up_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.mlp.shared_experts.up_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.post_attention_layernorm.weight": "model-00064-of-00092.safetensors", + "model.layers.63.self_attn.k_norm.weight": "model-00064-of-00092.safetensors", + "model.layers.63.self_attn.k_proj.bias": "model-00064-of-00092.safetensors", + "model.layers.63.self_attn.k_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.self_attn.k_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.self_attn.o_proj.weight": "model-00064-of-00092.safetensors", + 
"model.layers.63.self_attn.o_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.self_attn.q_norm.weight": "model-00064-of-00092.safetensors", + "model.layers.63.self_attn.q_proj.bias": "model-00064-of-00092.safetensors", + "model.layers.63.self_attn.q_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.self_attn.q_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.63.self_attn.v_proj.bias": "model-00064-of-00092.safetensors", + "model.layers.63.self_attn.v_proj.weight": "model-00064-of-00092.safetensors", + "model.layers.63.self_attn.v_proj.weight_scale": "model-00064-of-00092.safetensors", + "model.layers.64.input_layernorm.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.0.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.0.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.0.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.0.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.0.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.0.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.1.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.1.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.1.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.1.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.1.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.1.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.10.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.10.down_proj.weight_scale": 
"model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.10.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.10.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.10.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.10.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.100.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.100.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.100.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.100.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.100.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.100.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.101.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.101.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.101.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.101.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.101.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.101.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.102.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.102.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.102.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.102.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.102.up_proj.weight": "model-00065-of-00092.safetensors", + 
"model.layers.64.mlp.experts.102.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.103.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.103.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.103.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.103.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.103.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.103.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.104.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.104.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.104.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.104.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.104.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.104.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.105.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.105.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.105.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.105.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.105.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.105.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.106.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.106.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.106.gate_proj.weight": 
"model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.106.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.106.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.106.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.107.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.107.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.107.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.107.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.107.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.107.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.108.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.108.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.108.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.108.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.108.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.108.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.109.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.109.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.109.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.109.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.109.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.109.up_proj.weight_scale": "model-00065-of-00092.safetensors", + 
"model.layers.64.mlp.experts.11.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.11.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.11.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.11.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.11.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.11.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.110.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.110.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.110.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.110.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.110.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.110.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.111.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.111.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.111.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.111.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.111.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.111.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.112.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.112.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.112.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.112.gate_proj.weight_scale": 
"model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.112.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.112.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.113.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.113.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.113.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.113.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.113.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.113.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.114.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.114.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.114.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.114.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.114.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.114.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.115.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.115.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.115.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.115.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.115.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.115.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.116.down_proj.weight": "model-00065-of-00092.safetensors", + 
"model.layers.64.mlp.experts.116.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.116.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.116.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.116.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.116.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.117.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.117.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.117.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.117.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.117.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.117.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.118.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.118.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.118.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.118.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.118.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.118.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.119.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.119.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.119.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.119.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.119.up_proj.weight": 
"model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.119.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.12.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.12.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.12.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.12.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.12.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.12.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.120.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.120.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.120.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.120.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.120.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.120.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.121.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.121.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.121.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.121.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.121.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.121.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.122.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.122.down_proj.weight_scale": "model-00065-of-00092.safetensors", + 
"model.layers.64.mlp.experts.122.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.122.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.122.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.122.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.123.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.123.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.123.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.123.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.123.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.123.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.124.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.124.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.124.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.124.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.124.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.124.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.125.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.125.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.125.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.125.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.125.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.125.up_proj.weight_scale": 
"model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.126.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.126.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.126.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.126.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.126.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.126.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.127.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.127.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.127.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.127.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.127.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.127.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.128.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.128.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.128.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.128.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.128.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.128.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.129.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.129.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.129.gate_proj.weight": "model-00065-of-00092.safetensors", + 
"model.layers.64.mlp.experts.129.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.129.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.129.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.13.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.13.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.13.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.13.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.13.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.13.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.130.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.130.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.130.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.130.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.130.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.130.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.131.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.131.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.131.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.131.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.131.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.131.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.132.down_proj.weight": 
"model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.132.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.132.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.132.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.132.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.132.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.133.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.133.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.133.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.133.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.133.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.133.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.134.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.134.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.134.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.134.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.134.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.134.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.135.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.135.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.135.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.135.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + 
"model.layers.64.mlp.experts.135.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.135.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.136.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.136.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.136.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.136.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.136.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.136.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.137.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.137.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.137.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.137.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.137.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.137.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.138.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.138.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.138.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.138.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.138.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.138.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.139.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.139.down_proj.weight_scale": 
"model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.139.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.139.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.139.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.139.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.14.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.14.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.14.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.14.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.14.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.14.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.140.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.140.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.140.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.140.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.140.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.140.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.141.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.141.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.141.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.141.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.141.up_proj.weight": "model-00065-of-00092.safetensors", + 
"model.layers.64.mlp.experts.141.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.142.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.142.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.142.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.142.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.142.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.142.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.143.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.143.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.143.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.143.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.143.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.143.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.144.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.144.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.144.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.144.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.144.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.144.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.145.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.145.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.145.gate_proj.weight": 
"model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.145.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.145.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.145.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.146.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.146.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.146.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.146.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.146.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.146.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.147.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.147.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.147.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.147.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.147.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.147.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.148.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.148.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.148.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.148.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.148.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.148.up_proj.weight_scale": "model-00065-of-00092.safetensors", + 
"model.layers.64.mlp.experts.149.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.149.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.149.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.149.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.149.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.149.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.15.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.15.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.15.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.15.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.15.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.15.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.150.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.150.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.150.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.150.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.150.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.150.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.151.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.151.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.151.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.151.gate_proj.weight_scale": 
"model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.151.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.151.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.152.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.152.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.152.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.152.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.152.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.152.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.153.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.153.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.153.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.153.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.153.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.153.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.154.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.154.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.154.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.154.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.154.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.154.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.155.down_proj.weight": "model-00065-of-00092.safetensors", + 
"model.layers.64.mlp.experts.155.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.155.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.155.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.155.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.155.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.156.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.156.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.156.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.156.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.156.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.156.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.157.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.157.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.157.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.157.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.157.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.157.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.158.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.158.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.158.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.158.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.158.up_proj.weight": 
"model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.158.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.159.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.159.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.159.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.159.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.159.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.159.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.16.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.16.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.16.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.16.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.16.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.16.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.17.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.17.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.17.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.17.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.17.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.17.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.18.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.18.down_proj.weight_scale": "model-00065-of-00092.safetensors", + 
"model.layers.64.mlp.experts.18.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.18.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.18.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.18.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.19.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.19.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.19.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.19.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.19.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.19.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.2.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.2.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.2.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.2.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.2.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.2.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.20.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.20.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.20.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.20.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.20.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.20.up_proj.weight_scale": "model-00065-of-00092.safetensors", 
+ "model.layers.64.mlp.experts.21.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.21.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.21.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.21.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.21.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.21.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.22.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.22.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.22.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.22.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.22.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.22.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.23.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.23.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.23.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.23.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.23.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.23.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.24.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.24.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.24.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.24.gate_proj.weight_scale": 
"model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.24.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.24.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.25.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.25.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.25.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.25.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.25.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.25.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.26.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.26.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.26.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.26.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.26.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.26.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.27.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.27.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.27.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.27.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.27.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.27.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.28.down_proj.weight": "model-00065-of-00092.safetensors", + 
"model.layers.64.mlp.experts.28.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.28.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.28.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.28.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.28.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.29.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.29.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.29.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.29.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.29.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.29.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.3.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.3.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.3.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.3.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.3.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.3.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.30.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.30.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.30.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.30.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.30.up_proj.weight": 
"model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.30.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.31.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.31.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.31.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.31.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.31.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.31.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.32.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.32.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.32.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.32.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.32.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.32.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.33.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.33.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.33.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.33.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.33.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.33.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.34.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.34.down_proj.weight_scale": "model-00065-of-00092.safetensors", + 
"model.layers.64.mlp.experts.34.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.34.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.34.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.34.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.35.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.35.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.35.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.35.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.35.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.35.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.36.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.36.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.36.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.36.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.36.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.36.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.37.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.37.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.37.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.37.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.37.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.37.up_proj.weight_scale": 
"model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.38.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.38.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.38.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.38.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.38.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.38.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.39.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.39.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.39.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.39.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.39.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.39.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.4.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.4.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.4.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.4.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.4.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.4.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.40.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.40.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.40.gate_proj.weight": "model-00065-of-00092.safetensors", + 
"model.layers.64.mlp.experts.40.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.40.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.40.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.41.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.41.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.41.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.41.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.41.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.41.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.42.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.42.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.42.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.42.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.42.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.42.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.43.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.43.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.43.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.43.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.43.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.43.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.44.down_proj.weight": 
"model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.44.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.44.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.44.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.44.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.44.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.45.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.45.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.45.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.45.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.45.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.45.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.46.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.46.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.46.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.46.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.46.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.46.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.47.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.47.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.47.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.47.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + 
"model.layers.64.mlp.experts.47.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.47.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.48.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.48.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.48.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.48.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.48.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.48.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.49.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.49.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.49.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.49.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.49.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.49.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.5.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.5.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.5.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.5.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.5.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.5.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.50.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.50.down_proj.weight_scale": "model-00065-of-00092.safetensors", 
+ "model.layers.64.mlp.experts.50.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.50.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.50.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.50.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.51.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.51.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.51.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.51.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.51.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.51.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.52.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.52.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.52.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.52.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.52.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.52.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.53.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.53.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.53.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.53.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.53.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.53.up_proj.weight_scale": 
"model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.54.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.54.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.54.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.54.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.54.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.54.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.55.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.55.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.55.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.55.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.55.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.55.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.56.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.56.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.56.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.56.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.56.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.56.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.57.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.57.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.57.gate_proj.weight": "model-00065-of-00092.safetensors", + 
"model.layers.64.mlp.experts.57.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.57.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.57.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.58.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.58.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.58.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.58.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.58.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.58.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.59.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.59.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.59.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.59.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.59.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.59.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.6.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.6.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.6.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.6.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.6.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.6.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.60.down_proj.weight": "model-00065-of-00092.safetensors", 
+ "model.layers.64.mlp.experts.60.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.60.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.60.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.60.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.60.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.61.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.61.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.61.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.61.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.61.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.61.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.62.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.62.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.62.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.62.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.62.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.62.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.63.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.63.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.63.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.63.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.63.up_proj.weight": 
"model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.63.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.64.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.64.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.64.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.64.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.64.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.64.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.65.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.65.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.65.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.65.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.65.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.65.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.66.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.66.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.66.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.66.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.66.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.66.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.67.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.67.down_proj.weight_scale": "model-00065-of-00092.safetensors", + 
"model.layers.64.mlp.experts.67.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.67.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.67.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.67.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.68.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.68.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.68.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.68.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.68.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.68.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.69.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.69.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.69.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.69.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.69.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.69.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.7.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.7.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.7.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.7.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.7.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.7.up_proj.weight_scale": "model-00065-of-00092.safetensors", 
+ "model.layers.64.mlp.experts.70.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.70.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.70.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.70.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.70.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.70.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.71.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.71.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.71.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.71.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.71.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.71.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.72.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.72.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.72.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.72.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.72.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.72.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.73.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.73.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.73.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.73.gate_proj.weight_scale": 
"model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.73.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.73.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.74.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.74.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.74.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.74.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.74.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.74.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.75.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.75.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.75.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.75.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.75.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.75.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.76.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.76.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.76.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.76.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.76.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.76.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.77.down_proj.weight": "model-00065-of-00092.safetensors", + 
"model.layers.64.mlp.experts.77.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.77.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.77.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.77.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.77.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.78.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.78.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.78.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.78.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.78.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.78.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.79.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.79.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.79.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.79.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.79.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.79.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.8.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.8.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.8.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.8.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.8.up_proj.weight": 
"model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.8.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.80.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.80.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.80.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.80.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.80.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.80.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.81.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.81.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.81.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.81.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.81.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.81.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.82.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.82.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.82.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.82.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.82.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.82.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.83.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.83.down_proj.weight_scale": "model-00065-of-00092.safetensors", + 
"model.layers.64.mlp.experts.83.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.83.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.83.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.83.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.84.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.84.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.84.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.84.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.84.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.84.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.85.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.85.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.85.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.85.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.85.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.85.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.86.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.86.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.86.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.86.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.86.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.86.up_proj.weight_scale": 
"model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.87.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.87.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.87.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.87.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.87.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.87.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.88.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.88.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.88.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.88.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.88.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.88.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.89.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.89.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.89.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.89.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.89.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.89.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.9.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.9.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.9.gate_proj.weight": "model-00065-of-00092.safetensors", + 
"model.layers.64.mlp.experts.9.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.9.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.9.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.90.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.90.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.90.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.90.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.90.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.90.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.91.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.91.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.91.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.91.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.91.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.91.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.92.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.92.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.92.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.92.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.92.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.92.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.93.down_proj.weight": 
"model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.93.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.93.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.93.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.93.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.93.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.94.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.94.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.94.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.94.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.94.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.94.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.95.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.95.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.95.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.95.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.95.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.95.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.96.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.96.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.96.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.96.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + 
"model.layers.64.mlp.experts.96.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.96.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.97.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.97.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.97.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.97.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.97.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.97.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.98.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.98.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.98.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.98.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.98.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.98.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.99.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.99.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.99.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.99.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.99.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.experts.99.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.gate.e_score_correction_bias": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.gate.weight": "model-00065-of-00092.safetensors", + 
"model.layers.64.mlp.shared_experts.down_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.shared_experts.down_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.shared_experts.gate_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.shared_experts.gate_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.shared_experts.up_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.mlp.shared_experts.up_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.post_attention_layernorm.weight": "model-00065-of-00092.safetensors", + "model.layers.64.self_attn.k_norm.weight": "model-00065-of-00092.safetensors", + "model.layers.64.self_attn.k_proj.bias": "model-00065-of-00092.safetensors", + "model.layers.64.self_attn.k_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.self_attn.k_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.self_attn.o_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.self_attn.o_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.self_attn.q_norm.weight": "model-00065-of-00092.safetensors", + "model.layers.64.self_attn.q_proj.bias": "model-00065-of-00092.safetensors", + "model.layers.64.self_attn.q_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.self_attn.q_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.64.self_attn.v_proj.bias": "model-00065-of-00092.safetensors", + "model.layers.64.self_attn.v_proj.weight": "model-00065-of-00092.safetensors", + "model.layers.64.self_attn.v_proj.weight_scale": "model-00065-of-00092.safetensors", + "model.layers.65.input_layernorm.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.0.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.0.down_proj.weight_scale": "model-00066-of-00092.safetensors", + 
"model.layers.65.mlp.experts.0.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.0.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.0.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.0.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.1.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.1.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.1.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.1.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.1.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.1.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.10.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.10.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.10.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.10.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.10.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.10.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.100.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.100.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.100.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.100.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.100.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.100.up_proj.weight_scale": 
"model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.101.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.101.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.101.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.101.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.101.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.101.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.102.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.102.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.102.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.102.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.102.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.102.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.103.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.103.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.103.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.103.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.103.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.103.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.104.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.104.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.104.gate_proj.weight": "model-00066-of-00092.safetensors", + 
"model.layers.65.mlp.experts.104.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.104.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.104.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.105.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.105.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.105.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.105.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.105.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.105.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.106.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.106.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.106.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.106.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.106.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.106.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.107.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.107.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.107.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.107.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.107.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.107.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.108.down_proj.weight": 
"model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.108.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.108.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.108.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.108.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.108.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.109.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.109.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.109.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.109.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.109.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.109.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.11.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.11.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.11.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.11.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.11.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.11.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.110.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.110.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.110.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.110.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + 
"model.layers.65.mlp.experts.110.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.110.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.111.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.111.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.111.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.111.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.111.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.111.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.112.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.112.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.112.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.112.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.112.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.112.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.113.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.113.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.113.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.113.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.113.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.113.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.114.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.114.down_proj.weight_scale": 
"model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.114.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.114.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.114.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.114.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.115.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.115.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.115.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.115.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.115.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.115.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.116.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.116.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.116.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.116.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.116.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.116.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.117.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.117.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.117.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.117.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.117.up_proj.weight": "model-00066-of-00092.safetensors", + 
"model.layers.65.mlp.experts.117.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.118.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.118.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.118.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.118.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.118.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.118.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.119.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.119.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.119.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.119.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.119.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.119.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.12.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.12.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.12.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.12.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.12.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.12.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.120.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.120.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.120.gate_proj.weight": 
"model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.120.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.120.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.120.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.121.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.121.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.121.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.121.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.121.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.121.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.122.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.122.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.122.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.122.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.122.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.122.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.123.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.123.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.123.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.123.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.123.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.123.up_proj.weight_scale": "model-00066-of-00092.safetensors", + 
"model.layers.65.mlp.experts.124.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.124.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.124.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.124.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.124.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.124.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.125.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.125.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.125.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.125.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.125.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.125.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.126.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.126.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.126.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.126.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.126.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.126.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.127.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.127.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.127.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.127.gate_proj.weight_scale": 
"model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.127.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.127.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.128.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.128.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.128.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.128.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.128.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.128.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.129.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.129.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.129.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.129.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.129.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.129.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.13.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.13.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.13.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.13.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.13.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.13.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.130.down_proj.weight": "model-00066-of-00092.safetensors", + 
"model.layers.65.mlp.experts.130.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.130.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.130.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.130.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.130.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.131.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.131.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.131.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.131.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.131.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.131.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.132.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.132.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.132.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.132.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.132.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.132.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.133.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.133.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.133.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.133.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.133.up_proj.weight": 
"model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.133.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.134.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.134.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.134.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.134.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.134.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.134.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.135.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.135.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.135.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.135.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.135.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.135.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.136.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.136.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.136.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.136.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.136.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.136.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.137.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.137.down_proj.weight_scale": "model-00066-of-00092.safetensors", + 
"model.layers.65.mlp.experts.137.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.137.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.137.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.137.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.138.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.138.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.138.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.138.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.138.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.138.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.139.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.139.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.139.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.139.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.139.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.139.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.14.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.14.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.14.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.14.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.14.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.14.up_proj.weight_scale": 
"model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.140.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.140.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.140.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.140.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.140.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.140.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.141.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.141.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.141.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.141.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.141.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.141.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.142.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.142.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.142.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.142.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.142.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.142.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.143.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.143.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.143.gate_proj.weight": "model-00066-of-00092.safetensors", + 
"model.layers.65.mlp.experts.143.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.143.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.143.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.144.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.144.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.144.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.144.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.144.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.144.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.145.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.145.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.145.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.145.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.145.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.145.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.146.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.146.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.146.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.146.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.146.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.146.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.147.down_proj.weight": 
"model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.147.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.147.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.147.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.147.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.147.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.148.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.148.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.148.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.148.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.148.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.148.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.149.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.149.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.149.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.149.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.149.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.149.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.15.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.15.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.15.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.15.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + 
"model.layers.65.mlp.experts.15.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.15.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.150.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.150.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.150.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.150.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.150.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.150.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.151.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.151.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.151.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.151.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.151.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.151.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.152.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.152.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.152.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.152.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.152.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.152.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.153.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.153.down_proj.weight_scale": 
"model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.153.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.153.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.153.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.153.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.154.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.154.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.154.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.154.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.154.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.154.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.155.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.155.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.155.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.155.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.155.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.155.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.156.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.156.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.156.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.156.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.156.up_proj.weight": "model-00066-of-00092.safetensors", + 
"model.layers.65.mlp.experts.156.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.157.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.157.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.157.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.157.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.157.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.157.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.158.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.158.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.158.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.158.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.158.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.158.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.159.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.159.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.159.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.159.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.159.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.159.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.16.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.16.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.16.gate_proj.weight": 
"model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.16.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.16.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.16.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.17.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.17.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.17.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.17.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.17.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.17.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.18.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.18.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.18.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.18.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.18.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.18.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.19.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.19.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.19.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.19.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.19.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.19.up_proj.weight_scale": "model-00066-of-00092.safetensors", + 
"model.layers.65.mlp.experts.2.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.2.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.2.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.2.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.2.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.2.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.20.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.20.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.20.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.20.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.20.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.20.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.21.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.21.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.21.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.21.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.21.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.21.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.22.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.22.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.22.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.22.gate_proj.weight_scale": 
"model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.22.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.22.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.23.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.23.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.23.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.23.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.23.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.23.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.24.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.24.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.24.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.24.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.24.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.24.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.25.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.25.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.25.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.25.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.25.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.25.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.26.down_proj.weight": "model-00066-of-00092.safetensors", + 
"model.layers.65.mlp.experts.26.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.26.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.26.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.26.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.26.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.27.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.27.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.27.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.27.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.27.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.27.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.28.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.28.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.28.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.28.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.28.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.28.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.29.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.29.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.29.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.29.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.29.up_proj.weight": 
"model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.29.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.3.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.3.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.3.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.3.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.3.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.3.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.30.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.30.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.30.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.30.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.30.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.30.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.31.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.31.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.31.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.31.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.31.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.31.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.32.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.32.down_proj.weight_scale": "model-00066-of-00092.safetensors", + 
"model.layers.65.mlp.experts.32.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.32.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.32.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.32.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.33.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.33.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.33.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.33.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.33.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.33.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.34.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.34.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.34.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.34.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.34.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.34.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.35.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.35.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.35.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.35.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.35.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.35.up_proj.weight_scale": 
"model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.36.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.36.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.36.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.36.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.36.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.36.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.37.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.37.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.37.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.37.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.37.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.37.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.38.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.38.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.38.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.38.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.38.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.38.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.39.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.39.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.39.gate_proj.weight": "model-00066-of-00092.safetensors", + 
"model.layers.65.mlp.experts.39.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.39.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.39.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.4.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.4.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.4.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.4.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.4.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.4.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.40.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.40.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.40.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.40.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.40.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.40.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.41.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.41.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.41.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.41.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.41.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.41.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.42.down_proj.weight": "model-00066-of-00092.safetensors", 
+ "model.layers.65.mlp.experts.42.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.42.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.42.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.42.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.42.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.43.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.43.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.43.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.43.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.43.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.43.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.44.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.44.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.44.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.44.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.44.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.44.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.45.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.45.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.45.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.45.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.45.up_proj.weight": 
"model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.45.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.46.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.46.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.46.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.46.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.46.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.46.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.47.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.47.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.47.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.47.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.47.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.47.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.48.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.48.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.48.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.48.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.48.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.48.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.49.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.49.down_proj.weight_scale": "model-00066-of-00092.safetensors", + 
"model.layers.65.mlp.experts.49.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.49.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.49.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.49.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.5.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.5.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.5.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.5.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.5.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.5.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.50.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.50.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.50.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.50.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.50.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.50.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.51.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.51.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.51.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.51.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.51.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.51.up_proj.weight_scale": "model-00066-of-00092.safetensors", 
+ "model.layers.65.mlp.experts.52.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.52.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.52.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.52.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.52.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.52.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.53.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.53.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.53.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.53.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.53.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.53.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.54.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.54.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.54.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.54.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.54.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.54.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.55.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.55.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.55.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.55.gate_proj.weight_scale": 
"model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.55.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.55.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.56.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.56.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.56.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.56.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.56.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.56.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.57.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.57.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.57.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.57.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.57.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.57.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.58.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.58.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.58.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.58.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.58.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.58.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.59.down_proj.weight": "model-00066-of-00092.safetensors", + 
"model.layers.65.mlp.experts.59.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.59.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.59.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.59.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.59.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.6.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.6.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.6.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.6.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.6.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.6.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.60.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.60.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.60.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.60.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.60.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.60.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.61.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.61.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.61.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.61.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.61.up_proj.weight": 
"model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.61.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.62.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.62.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.62.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.62.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.62.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.62.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.63.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.63.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.63.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.63.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.63.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.63.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.64.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.64.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.64.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.64.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.64.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.64.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.65.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.65.down_proj.weight_scale": "model-00066-of-00092.safetensors", + 
"model.layers.65.mlp.experts.65.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.65.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.65.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.65.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.66.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.66.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.66.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.66.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.66.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.66.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.67.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.67.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.67.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.67.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.67.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.67.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.68.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.68.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.68.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.68.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.68.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.68.up_proj.weight_scale": 
"model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.69.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.69.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.69.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.69.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.69.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.69.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.7.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.7.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.7.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.7.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.7.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.7.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.70.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.70.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.70.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.70.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.70.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.70.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.71.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.71.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.71.gate_proj.weight": "model-00066-of-00092.safetensors", + 
"model.layers.65.mlp.experts.71.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.71.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.71.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.72.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.72.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.72.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.72.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.72.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.72.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.73.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.73.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.73.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.73.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.73.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.73.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.74.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.74.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.74.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.74.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.74.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.74.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.75.down_proj.weight": 
"model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.75.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.75.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.75.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.75.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.75.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.76.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.76.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.76.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.76.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.76.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.76.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.77.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.77.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.77.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.77.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.77.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.77.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.78.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.78.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.78.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.78.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + 
"model.layers.65.mlp.experts.78.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.78.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.79.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.79.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.79.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.79.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.79.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.79.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.8.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.8.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.8.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.8.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.8.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.8.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.80.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.80.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.80.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.80.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.80.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.80.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.81.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.81.down_proj.weight_scale": "model-00066-of-00092.safetensors", 
+ "model.layers.65.mlp.experts.81.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.81.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.81.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.81.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.82.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.82.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.82.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.82.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.82.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.82.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.83.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.83.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.83.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.83.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.83.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.83.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.84.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.84.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.84.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.84.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.84.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.84.up_proj.weight_scale": 
"model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.85.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.85.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.85.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.85.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.85.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.85.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.86.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.86.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.86.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.86.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.86.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.86.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.87.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.87.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.87.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.87.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.87.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.87.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.88.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.88.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.88.gate_proj.weight": "model-00066-of-00092.safetensors", + 
"model.layers.65.mlp.experts.88.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.88.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.88.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.89.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.89.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.89.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.89.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.89.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.89.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.9.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.9.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.9.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.9.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.9.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.9.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.90.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.90.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.90.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.90.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.90.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.90.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.91.down_proj.weight": "model-00066-of-00092.safetensors", 
+ "model.layers.65.mlp.experts.91.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.91.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.91.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.91.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.91.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.92.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.92.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.92.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.92.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.92.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.92.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.93.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.93.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.93.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.93.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.93.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.93.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.94.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.94.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.94.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.94.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.94.up_proj.weight": 
"model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.94.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.95.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.95.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.95.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.95.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.95.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.95.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.96.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.96.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.96.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.96.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.96.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.96.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.97.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.97.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.97.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.97.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.97.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.97.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.98.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.98.down_proj.weight_scale": "model-00066-of-00092.safetensors", + 
"model.layers.65.mlp.experts.98.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.98.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.98.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.98.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.99.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.99.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.99.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.99.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.99.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.experts.99.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.gate.e_score_correction_bias": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.gate.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.shared_experts.down_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.shared_experts.down_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.shared_experts.gate_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.shared_experts.gate_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.shared_experts.up_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.mlp.shared_experts.up_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.post_attention_layernorm.weight": "model-00066-of-00092.safetensors", + "model.layers.65.self_attn.k_norm.weight": "model-00066-of-00092.safetensors", + "model.layers.65.self_attn.k_proj.bias": "model-00066-of-00092.safetensors", + "model.layers.65.self_attn.k_proj.weight": "model-00066-of-00092.safetensors", + 
"model.layers.65.self_attn.k_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.self_attn.o_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.self_attn.o_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.self_attn.q_norm.weight": "model-00066-of-00092.safetensors", + "model.layers.65.self_attn.q_proj.bias": "model-00066-of-00092.safetensors", + "model.layers.65.self_attn.q_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.self_attn.q_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.65.self_attn.v_proj.bias": "model-00066-of-00092.safetensors", + "model.layers.65.self_attn.v_proj.weight": "model-00066-of-00092.safetensors", + "model.layers.65.self_attn.v_proj.weight_scale": "model-00066-of-00092.safetensors", + "model.layers.66.input_layernorm.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.0.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.0.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.0.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.0.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.0.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.0.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.1.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.1.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.1.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.1.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.1.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.1.up_proj.weight_scale": "model-00067-of-00092.safetensors", + 
"model.layers.66.mlp.experts.10.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.10.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.10.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.10.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.10.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.10.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.100.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.100.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.100.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.100.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.100.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.100.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.101.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.101.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.101.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.101.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.101.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.101.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.102.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.102.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.102.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.102.gate_proj.weight_scale": 
"model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.102.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.102.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.103.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.103.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.103.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.103.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.103.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.103.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.104.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.104.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.104.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.104.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.104.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.104.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.105.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.105.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.105.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.105.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.105.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.105.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.106.down_proj.weight": "model-00067-of-00092.safetensors", + 
"model.layers.66.mlp.experts.106.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.106.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.106.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.106.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.106.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.107.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.107.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.107.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.107.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.107.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.107.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.108.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.108.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.108.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.108.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.108.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.108.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.109.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.109.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.109.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.109.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.109.up_proj.weight": 
"model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.109.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.11.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.11.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.11.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.11.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.11.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.11.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.110.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.110.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.110.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.110.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.110.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.110.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.111.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.111.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.111.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.111.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.111.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.111.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.112.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.112.down_proj.weight_scale": "model-00067-of-00092.safetensors", + 
"model.layers.66.mlp.experts.112.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.112.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.112.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.112.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.113.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.113.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.113.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.113.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.113.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.113.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.114.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.114.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.114.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.114.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.114.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.114.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.115.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.115.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.115.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.115.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.115.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.115.up_proj.weight_scale": 
"model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.116.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.116.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.116.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.116.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.116.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.116.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.117.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.117.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.117.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.117.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.117.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.117.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.118.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.118.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.118.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.118.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.118.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.118.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.119.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.119.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.119.gate_proj.weight": "model-00067-of-00092.safetensors", + 
"model.layers.66.mlp.experts.119.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.119.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.119.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.12.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.12.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.12.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.12.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.12.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.12.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.120.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.120.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.120.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.120.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.120.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.120.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.121.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.121.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.121.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.121.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.121.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.121.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.122.down_proj.weight": 
"model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.122.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.122.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.122.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.122.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.122.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.123.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.123.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.123.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.123.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.123.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.123.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.124.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.124.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.124.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.124.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.124.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.124.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.125.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.125.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.125.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.125.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + 
"model.layers.66.mlp.experts.125.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.125.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.126.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.126.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.126.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.126.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.126.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.126.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.127.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.127.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.127.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.127.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.127.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.127.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.128.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.128.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.128.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.128.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.128.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.128.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.129.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.129.down_proj.weight_scale": 
"model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.129.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.129.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.129.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.129.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.13.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.13.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.13.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.13.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.13.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.13.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.130.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.130.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.130.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.130.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.130.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.130.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.131.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.131.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.131.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.131.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.131.up_proj.weight": "model-00067-of-00092.safetensors", + 
"model.layers.66.mlp.experts.131.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.132.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.132.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.132.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.132.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.132.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.132.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.133.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.133.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.133.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.133.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.133.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.133.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.134.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.134.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.134.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.134.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.134.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.134.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.135.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.135.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.135.gate_proj.weight": 
"model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.135.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.135.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.135.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.136.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.136.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.136.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.136.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.136.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.136.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.137.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.137.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.137.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.137.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.137.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.137.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.138.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.138.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.138.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.138.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.138.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.138.up_proj.weight_scale": "model-00067-of-00092.safetensors", + 
"model.layers.66.mlp.experts.139.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.139.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.139.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.139.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.139.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.139.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.14.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.14.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.14.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.14.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.14.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.14.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.140.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.140.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.140.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.140.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.140.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.140.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.141.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.141.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.141.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.141.gate_proj.weight_scale": 
"model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.141.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.141.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.142.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.142.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.142.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.142.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.142.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.142.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.143.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.143.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.143.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.143.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.143.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.143.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.144.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.144.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.144.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.144.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.144.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.144.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.145.down_proj.weight": "model-00067-of-00092.safetensors", + 
"model.layers.66.mlp.experts.145.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.145.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.145.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.145.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.145.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.146.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.146.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.146.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.146.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.146.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.146.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.147.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.147.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.147.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.147.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.147.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.147.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.148.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.148.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.148.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.148.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.148.up_proj.weight": 
"model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.148.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.149.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.149.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.149.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.149.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.149.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.149.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.15.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.15.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.15.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.15.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.15.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.15.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.150.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.150.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.150.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.150.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.150.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.150.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.151.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.151.down_proj.weight_scale": "model-00067-of-00092.safetensors", + 
"model.layers.66.mlp.experts.151.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.151.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.151.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.151.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.152.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.152.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.152.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.152.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.152.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.152.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.153.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.153.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.153.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.153.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.153.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.153.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.154.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.154.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.154.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.154.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.154.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.154.up_proj.weight_scale": 
"model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.155.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.155.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.155.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.155.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.155.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.155.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.156.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.156.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.156.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.156.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.156.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.156.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.157.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.157.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.157.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.157.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.157.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.157.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.158.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.158.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.158.gate_proj.weight": "model-00067-of-00092.safetensors", + 
"model.layers.66.mlp.experts.158.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.158.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.158.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.159.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.159.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.159.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.159.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.159.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.159.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.16.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.16.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.16.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.16.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.16.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.16.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.17.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.17.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.17.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.17.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.17.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.17.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.18.down_proj.weight": 
"model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.18.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.18.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.18.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.18.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.18.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.19.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.19.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.19.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.19.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.19.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.19.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.2.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.2.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.2.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.2.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.2.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.2.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.20.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.20.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.20.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.20.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + 
"model.layers.66.mlp.experts.20.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.20.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.21.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.21.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.21.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.21.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.21.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.21.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.22.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.22.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.22.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.22.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.22.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.22.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.23.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.23.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.23.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.23.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.23.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.23.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.24.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.24.down_proj.weight_scale": 
"model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.24.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.24.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.24.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.24.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.25.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.25.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.25.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.25.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.25.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.25.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.26.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.26.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.26.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.26.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.26.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.26.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.27.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.27.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.27.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.27.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.27.up_proj.weight": "model-00067-of-00092.safetensors", + 
"model.layers.66.mlp.experts.27.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.28.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.28.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.28.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.28.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.28.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.28.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.29.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.29.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.29.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.29.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.29.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.29.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.3.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.3.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.3.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.3.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.3.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.3.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.30.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.30.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.30.gate_proj.weight": 
"model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.30.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.30.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.30.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.31.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.31.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.31.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.31.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.31.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.31.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.32.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.32.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.32.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.32.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.32.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.32.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.33.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.33.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.33.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.33.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.33.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.33.up_proj.weight_scale": "model-00067-of-00092.safetensors", + 
"model.layers.66.mlp.experts.34.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.34.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.34.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.34.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.34.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.34.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.35.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.35.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.35.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.35.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.35.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.35.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.36.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.36.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.36.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.36.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.36.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.36.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.37.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.37.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.37.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.37.gate_proj.weight_scale": 
"model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.37.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.37.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.38.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.38.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.38.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.38.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.38.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.38.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.39.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.39.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.39.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.39.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.39.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.39.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.4.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.4.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.4.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.4.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.4.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.4.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.40.down_proj.weight": "model-00067-of-00092.safetensors", + 
"model.layers.66.mlp.experts.40.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.40.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.40.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.40.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.40.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.41.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.41.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.41.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.41.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.41.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.41.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.42.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.42.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.42.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.42.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.42.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.42.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.43.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.43.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.43.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.43.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.43.up_proj.weight": 
"model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.43.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.44.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.44.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.44.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.44.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.44.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.44.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.45.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.45.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.45.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.45.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.45.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.45.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.46.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.46.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.46.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.46.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.46.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.46.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.47.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.47.down_proj.weight_scale": "model-00067-of-00092.safetensors", + 
"model.layers.66.mlp.experts.47.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.47.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.47.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.47.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.48.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.48.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.48.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.48.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.48.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.48.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.49.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.49.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.49.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.49.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.49.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.49.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.5.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.5.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.5.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.5.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.5.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.5.up_proj.weight_scale": "model-00067-of-00092.safetensors", 
+ "model.layers.66.mlp.experts.50.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.50.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.50.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.50.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.50.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.50.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.51.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.51.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.51.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.51.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.51.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.51.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.52.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.52.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.52.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.52.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.52.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.52.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.53.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.53.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.53.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.53.gate_proj.weight_scale": 
"model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.53.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.53.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.54.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.54.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.54.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.54.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.54.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.54.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.55.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.55.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.55.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.55.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.55.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.55.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.56.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.56.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.56.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.56.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.56.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.56.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.57.down_proj.weight": "model-00067-of-00092.safetensors", + 
"model.layers.66.mlp.experts.57.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.57.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.57.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.57.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.57.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.58.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.58.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.58.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.58.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.58.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.58.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.59.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.59.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.59.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.59.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.59.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.59.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.6.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.6.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.6.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.6.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.6.up_proj.weight": 
"model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.6.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.60.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.60.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.60.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.60.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.60.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.60.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.61.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.61.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.61.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.61.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.61.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.61.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.62.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.62.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.62.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.62.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.62.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.62.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.63.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.63.down_proj.weight_scale": "model-00067-of-00092.safetensors", + 
"model.layers.66.mlp.experts.63.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.63.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.63.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.63.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.64.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.64.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.64.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.64.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.64.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.64.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.65.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.65.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.65.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.65.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.65.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.65.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.66.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.66.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.66.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.66.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.66.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.66.up_proj.weight_scale": 
"model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.67.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.67.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.67.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.67.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.67.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.67.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.68.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.68.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.68.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.68.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.68.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.68.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.69.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.69.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.69.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.69.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.69.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.69.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.7.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.7.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.7.gate_proj.weight": "model-00067-of-00092.safetensors", + 
"model.layers.66.mlp.experts.7.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.7.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.7.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.70.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.70.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.70.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.70.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.70.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.70.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.71.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.71.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.71.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.71.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.71.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.71.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.72.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.72.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.72.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.72.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.72.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.72.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.73.down_proj.weight": 
"model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.73.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.73.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.73.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.73.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.73.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.74.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.74.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.74.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.74.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.74.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.74.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.75.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.75.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.75.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.75.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.75.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.75.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.76.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.76.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.76.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.76.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + 
"model.layers.66.mlp.experts.76.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.76.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.77.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.77.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.77.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.77.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.77.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.77.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.78.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.78.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.78.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.78.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.78.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.78.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.79.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.79.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.79.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.79.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.79.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.79.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.8.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.8.down_proj.weight_scale": 
"model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.8.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.8.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.8.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.8.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.80.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.80.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.80.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.80.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.80.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.80.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.81.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.81.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.81.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.81.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.81.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.81.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.82.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.82.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.82.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.82.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.82.up_proj.weight": "model-00067-of-00092.safetensors", + 
"model.layers.66.mlp.experts.82.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.83.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.83.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.83.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.83.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.83.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.83.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.84.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.84.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.84.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.84.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.84.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.84.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.85.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.85.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.85.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.85.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.85.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.85.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.86.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.86.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.86.gate_proj.weight": 
"model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.86.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.86.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.86.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.87.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.87.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.87.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.87.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.87.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.87.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.88.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.88.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.88.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.88.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.88.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.88.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.89.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.89.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.89.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.89.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.89.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.89.up_proj.weight_scale": "model-00067-of-00092.safetensors", + 
"model.layers.66.mlp.experts.9.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.9.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.9.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.9.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.9.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.9.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.90.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.90.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.90.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.90.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.90.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.90.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.91.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.91.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.91.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.91.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.91.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.91.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.92.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.92.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.92.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.92.gate_proj.weight_scale": 
"model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.92.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.92.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.93.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.93.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.93.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.93.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.93.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.93.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.94.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.94.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.94.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.94.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.94.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.94.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.95.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.95.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.95.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.95.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.95.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.95.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.96.down_proj.weight": "model-00067-of-00092.safetensors", + 
"model.layers.66.mlp.experts.96.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.96.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.96.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.96.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.96.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.97.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.97.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.97.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.97.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.97.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.97.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.98.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.98.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.98.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.98.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.98.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.98.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.99.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.99.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.99.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.99.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.99.up_proj.weight": 
"model-00067-of-00092.safetensors", + "model.layers.66.mlp.experts.99.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.gate.e_score_correction_bias": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.gate.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.shared_experts.down_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.shared_experts.down_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.shared_experts.gate_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.shared_experts.gate_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.shared_experts.up_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.mlp.shared_experts.up_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.post_attention_layernorm.weight": "model-00067-of-00092.safetensors", + "model.layers.66.self_attn.k_norm.weight": "model-00067-of-00092.safetensors", + "model.layers.66.self_attn.k_proj.bias": "model-00067-of-00092.safetensors", + "model.layers.66.self_attn.k_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.self_attn.k_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.self_attn.o_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.self_attn.o_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.self_attn.q_norm.weight": "model-00067-of-00092.safetensors", + "model.layers.66.self_attn.q_proj.bias": "model-00067-of-00092.safetensors", + "model.layers.66.self_attn.q_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.self_attn.q_proj.weight_scale": "model-00067-of-00092.safetensors", + "model.layers.66.self_attn.v_proj.bias": "model-00067-of-00092.safetensors", + "model.layers.66.self_attn.v_proj.weight": "model-00067-of-00092.safetensors", + "model.layers.66.self_attn.v_proj.weight_scale": 
"model-00067-of-00092.safetensors", + "model.layers.67.input_layernorm.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.0.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.0.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.0.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.0.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.0.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.0.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.1.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.1.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.1.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.1.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.1.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.1.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.10.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.10.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.10.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.10.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.10.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.10.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.100.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.100.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.100.gate_proj.weight": 
"model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.100.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.100.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.100.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.101.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.101.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.101.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.101.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.101.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.101.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.102.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.102.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.102.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.102.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.102.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.102.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.103.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.103.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.103.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.103.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.103.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.103.up_proj.weight_scale": "model-00068-of-00092.safetensors", + 
"model.layers.67.mlp.experts.104.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.104.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.104.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.104.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.104.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.104.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.105.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.105.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.105.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.105.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.105.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.105.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.106.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.106.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.106.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.106.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.106.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.106.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.107.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.107.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.107.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.107.gate_proj.weight_scale": 
"model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.107.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.107.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.108.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.108.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.108.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.108.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.108.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.108.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.109.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.109.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.109.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.109.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.109.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.109.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.11.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.11.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.11.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.11.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.11.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.11.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.110.down_proj.weight": "model-00068-of-00092.safetensors", + 
"model.layers.67.mlp.experts.110.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.110.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.110.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.110.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.110.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.111.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.111.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.111.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.111.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.111.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.111.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.112.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.112.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.112.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.112.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.112.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.112.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.113.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.113.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.113.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.113.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.113.up_proj.weight": 
"model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.113.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.114.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.114.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.114.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.114.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.114.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.114.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.115.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.115.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.115.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.115.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.115.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.115.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.116.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.116.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.116.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.116.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.116.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.116.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.117.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.117.down_proj.weight_scale": "model-00068-of-00092.safetensors", + 
"model.layers.67.mlp.experts.117.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.117.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.117.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.117.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.118.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.118.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.118.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.118.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.118.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.118.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.119.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.119.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.119.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.119.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.119.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.119.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.12.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.12.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.12.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.12.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.12.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.12.up_proj.weight_scale": 
"model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.120.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.120.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.120.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.120.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.120.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.120.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.121.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.121.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.121.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.121.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.121.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.121.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.122.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.122.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.122.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.122.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.122.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.122.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.123.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.123.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.123.gate_proj.weight": "model-00068-of-00092.safetensors", + 
"model.layers.67.mlp.experts.123.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.123.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.123.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.124.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.124.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.124.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.124.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.124.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.124.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.125.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.125.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.125.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.125.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.125.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.125.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.126.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.126.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.126.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.126.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.126.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.126.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.127.down_proj.weight": 
"model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.127.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.127.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.127.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.127.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.127.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.128.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.128.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.128.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.128.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.128.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.128.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.129.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.129.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.129.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.129.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.129.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.129.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.13.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.13.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.13.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.13.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + 
"model.layers.67.mlp.experts.13.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.13.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.130.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.130.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.130.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.130.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.130.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.130.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.131.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.131.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.131.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.131.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.131.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.131.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.132.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.132.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.132.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.132.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.132.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.132.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.133.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.133.down_proj.weight_scale": 
"model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.133.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.133.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.133.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.133.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.134.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.134.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.134.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.134.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.134.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.134.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.135.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.135.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.135.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.135.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.135.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.135.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.136.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.136.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.136.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.136.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.136.up_proj.weight": "model-00068-of-00092.safetensors", + 
"model.layers.67.mlp.experts.136.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.137.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.137.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.137.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.137.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.137.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.137.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.138.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.138.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.138.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.138.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.138.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.138.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.139.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.139.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.139.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.139.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.139.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.139.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.14.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.14.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.14.gate_proj.weight": 
"model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.14.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.14.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.14.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.140.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.140.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.140.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.140.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.140.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.140.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.141.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.141.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.141.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.141.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.141.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.141.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.142.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.142.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.142.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.142.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.142.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.142.up_proj.weight_scale": "model-00068-of-00092.safetensors", + 
"model.layers.67.mlp.experts.143.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.143.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.143.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.143.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.143.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.143.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.144.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.144.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.144.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.144.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.144.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.144.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.145.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.145.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.145.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.145.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.145.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.145.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.146.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.146.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.146.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.146.gate_proj.weight_scale": 
"model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.146.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.146.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.147.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.147.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.147.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.147.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.147.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.147.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.148.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.148.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.148.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.148.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.148.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.148.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.149.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.149.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.149.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.149.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.149.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.149.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.15.down_proj.weight": "model-00068-of-00092.safetensors", + 
"model.layers.67.mlp.experts.15.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.15.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.15.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.15.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.15.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.150.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.150.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.150.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.150.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.150.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.150.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.151.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.151.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.151.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.151.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.151.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.151.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.152.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.152.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.152.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.152.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.152.up_proj.weight": 
"model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.152.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.153.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.153.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.153.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.153.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.153.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.153.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.154.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.154.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.154.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.154.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.154.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.154.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.155.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.155.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.155.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.155.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.155.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.155.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.156.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.156.down_proj.weight_scale": "model-00068-of-00092.safetensors", + 
"model.layers.67.mlp.experts.156.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.156.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.156.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.156.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.157.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.157.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.157.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.157.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.157.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.157.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.158.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.158.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.158.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.158.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.158.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.158.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.159.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.159.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.159.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.159.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.159.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.159.up_proj.weight_scale": 
"model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.16.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.16.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.16.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.16.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.16.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.16.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.17.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.17.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.17.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.17.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.17.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.17.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.18.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.18.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.18.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.18.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.18.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.18.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.19.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.19.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.19.gate_proj.weight": "model-00068-of-00092.safetensors", + 
"model.layers.67.mlp.experts.19.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.19.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.19.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.2.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.2.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.2.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.2.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.2.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.2.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.20.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.20.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.20.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.20.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.20.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.20.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.21.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.21.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.21.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.21.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.21.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.21.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.22.down_proj.weight": "model-00068-of-00092.safetensors", 
+ "model.layers.67.mlp.experts.22.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.22.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.22.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.22.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.22.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.23.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.23.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.23.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.23.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.23.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.23.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.24.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.24.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.24.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.24.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.24.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.24.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.25.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.25.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.25.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.25.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.25.up_proj.weight": 
"model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.25.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.26.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.26.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.26.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.26.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.26.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.26.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.27.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.27.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.27.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.27.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.27.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.27.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.28.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.28.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.28.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.28.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.28.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.28.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.29.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.29.down_proj.weight_scale": "model-00068-of-00092.safetensors", + 
"model.layers.67.mlp.experts.29.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.29.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.29.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.29.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.3.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.3.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.3.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.3.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.3.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.3.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.30.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.30.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.30.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.30.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.30.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.30.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.31.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.31.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.31.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.31.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.31.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.31.up_proj.weight_scale": "model-00068-of-00092.safetensors", 
+ "model.layers.67.mlp.experts.32.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.32.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.32.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.32.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.32.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.32.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.33.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.33.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.33.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.33.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.33.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.33.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.34.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.34.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.34.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.34.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.34.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.34.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.35.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.35.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.35.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.35.gate_proj.weight_scale": 
"model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.35.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.35.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.36.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.36.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.36.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.36.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.36.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.36.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.37.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.37.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.37.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.37.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.37.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.37.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.38.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.38.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.38.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.38.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.38.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.38.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.39.down_proj.weight": "model-00068-of-00092.safetensors", + 
"model.layers.67.mlp.experts.39.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.39.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.39.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.39.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.39.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.4.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.4.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.4.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.4.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.4.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.4.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.40.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.40.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.40.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.40.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.40.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.40.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.41.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.41.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.41.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.41.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.41.up_proj.weight": 
"model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.41.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.42.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.42.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.42.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.42.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.42.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.42.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.43.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.43.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.43.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.43.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.43.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.43.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.44.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.44.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.44.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.44.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.44.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.44.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.45.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.45.down_proj.weight_scale": "model-00068-of-00092.safetensors", + 
"model.layers.67.mlp.experts.45.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.45.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.45.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.45.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.46.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.46.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.46.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.46.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.46.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.46.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.47.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.47.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.47.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.47.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.47.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.47.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.48.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.48.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.48.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.48.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.48.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.48.up_proj.weight_scale": 
"model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.49.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.49.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.49.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.49.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.49.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.49.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.5.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.5.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.5.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.5.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.5.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.5.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.50.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.50.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.50.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.50.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.50.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.50.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.51.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.51.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.51.gate_proj.weight": "model-00068-of-00092.safetensors", + 
"model.layers.67.mlp.experts.51.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.51.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.51.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.52.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.52.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.52.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.52.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.52.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.52.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.53.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.53.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.53.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.53.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.53.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.53.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.54.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.54.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.54.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.54.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.54.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.54.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.55.down_proj.weight": 
"model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.55.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.55.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.55.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.55.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.55.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.56.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.56.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.56.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.56.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.56.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.56.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.57.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.57.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.57.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.57.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.57.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.57.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.58.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.58.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.58.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.58.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + 
"model.layers.67.mlp.experts.58.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.58.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.59.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.59.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.59.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.59.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.59.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.59.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.6.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.6.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.6.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.6.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.6.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.6.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.60.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.60.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.60.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.60.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.60.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.60.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.61.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.61.down_proj.weight_scale": "model-00068-of-00092.safetensors", 
+ "model.layers.67.mlp.experts.61.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.61.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.61.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.61.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.62.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.62.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.62.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.62.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.62.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.62.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.63.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.63.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.63.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.63.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.63.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.63.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.64.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.64.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.64.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.64.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.64.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.64.up_proj.weight_scale": 
"model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.65.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.65.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.65.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.65.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.65.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.65.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.66.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.66.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.66.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.66.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.66.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.66.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.67.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.67.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.67.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.67.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.67.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.67.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.68.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.68.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.68.gate_proj.weight": "model-00068-of-00092.safetensors", + 
"model.layers.67.mlp.experts.68.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.68.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.68.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.69.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.69.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.69.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.69.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.69.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.69.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.7.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.7.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.7.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.7.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.7.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.7.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.70.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.70.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.70.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.70.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.70.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.70.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.71.down_proj.weight": "model-00068-of-00092.safetensors", 
+ "model.layers.67.mlp.experts.71.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.71.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.71.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.71.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.71.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.72.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.72.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.72.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.72.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.72.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.72.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.73.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.73.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.73.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.73.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.73.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.73.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.74.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.74.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.74.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.74.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.74.up_proj.weight": 
"model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.74.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.75.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.75.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.75.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.75.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.75.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.75.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.76.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.76.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.76.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.76.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.76.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.76.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.77.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.77.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.77.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.77.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.77.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.77.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.78.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.78.down_proj.weight_scale": "model-00068-of-00092.safetensors", + 
"model.layers.67.mlp.experts.78.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.78.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.78.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.78.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.79.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.79.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.79.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.79.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.79.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.79.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.8.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.8.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.8.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.8.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.8.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.8.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.80.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.80.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.80.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.80.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.80.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.80.up_proj.weight_scale": "model-00068-of-00092.safetensors", 
+ "model.layers.67.mlp.experts.81.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.81.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.81.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.81.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.81.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.81.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.82.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.82.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.82.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.82.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.82.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.82.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.83.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.83.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.83.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.83.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.83.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.83.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.84.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.84.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.84.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.84.gate_proj.weight_scale": 
"model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.84.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.84.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.85.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.85.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.85.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.85.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.85.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.85.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.86.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.86.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.86.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.86.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.86.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.86.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.87.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.87.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.87.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.87.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.87.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.87.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.88.down_proj.weight": "model-00068-of-00092.safetensors", + 
"model.layers.67.mlp.experts.88.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.88.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.88.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.88.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.88.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.89.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.89.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.89.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.89.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.89.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.89.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.9.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.9.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.9.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.9.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.9.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.9.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.90.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.90.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.90.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.90.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.90.up_proj.weight": 
"model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.90.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.91.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.91.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.91.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.91.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.91.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.91.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.92.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.92.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.92.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.92.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.92.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.92.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.93.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.93.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.93.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.93.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.93.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.93.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.94.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.94.down_proj.weight_scale": "model-00068-of-00092.safetensors", + 
"model.layers.67.mlp.experts.94.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.94.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.94.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.94.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.95.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.95.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.95.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.95.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.95.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.95.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.96.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.96.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.96.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.96.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.96.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.96.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.97.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.97.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.97.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.97.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.97.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.97.up_proj.weight_scale": 
"model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.98.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.98.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.98.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.98.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.98.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.98.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.99.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.99.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.99.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.99.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.99.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.experts.99.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.gate.e_score_correction_bias": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.gate.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.shared_experts.down_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.shared_experts.down_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.shared_experts.gate_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.shared_experts.gate_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.shared_experts.up_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.mlp.shared_experts.up_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.post_attention_layernorm.weight": "model-00068-of-00092.safetensors", + 
"model.layers.67.self_attn.k_norm.weight": "model-00068-of-00092.safetensors", + "model.layers.67.self_attn.k_proj.bias": "model-00068-of-00092.safetensors", + "model.layers.67.self_attn.k_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.self_attn.k_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.self_attn.o_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.self_attn.o_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.self_attn.q_norm.weight": "model-00068-of-00092.safetensors", + "model.layers.67.self_attn.q_proj.bias": "model-00068-of-00092.safetensors", + "model.layers.67.self_attn.q_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.self_attn.q_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.67.self_attn.v_proj.bias": "model-00068-of-00092.safetensors", + "model.layers.67.self_attn.v_proj.weight": "model-00068-of-00092.safetensors", + "model.layers.67.self_attn.v_proj.weight_scale": "model-00068-of-00092.safetensors", + "model.layers.68.input_layernorm.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.0.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.0.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.0.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.0.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.0.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.0.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.1.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.1.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.1.gate_proj.weight": "model-00069-of-00092.safetensors", + 
"model.layers.68.mlp.experts.1.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.1.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.1.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.10.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.10.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.10.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.10.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.10.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.10.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.100.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.100.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.100.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.100.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.100.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.100.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.101.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.101.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.101.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.101.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.101.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.101.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.102.down_proj.weight": 
"model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.102.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.102.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.102.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.102.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.102.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.103.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.103.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.103.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.103.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.103.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.103.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.104.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.104.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.104.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.104.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.104.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.104.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.105.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.105.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.105.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.105.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + 
"model.layers.68.mlp.experts.105.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.105.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.106.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.106.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.106.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.106.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.106.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.106.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.107.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.107.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.107.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.107.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.107.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.107.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.108.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.108.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.108.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.108.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.108.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.108.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.109.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.109.down_proj.weight_scale": 
"model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.109.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.109.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.109.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.109.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.11.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.11.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.11.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.11.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.11.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.11.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.110.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.110.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.110.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.110.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.110.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.110.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.111.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.111.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.111.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.111.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.111.up_proj.weight": "model-00069-of-00092.safetensors", + 
"model.layers.68.mlp.experts.111.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.112.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.112.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.112.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.112.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.112.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.112.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.113.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.113.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.113.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.113.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.113.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.113.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.114.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.114.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.114.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.114.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.114.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.114.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.115.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.115.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.115.gate_proj.weight": 
"model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.115.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.115.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.115.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.116.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.116.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.116.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.116.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.116.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.116.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.117.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.117.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.117.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.117.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.117.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.117.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.118.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.118.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.118.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.118.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.118.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.118.up_proj.weight_scale": "model-00069-of-00092.safetensors", + 
"model.layers.68.mlp.experts.119.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.119.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.119.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.119.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.119.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.119.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.12.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.12.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.12.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.12.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.12.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.12.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.120.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.120.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.120.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.120.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.120.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.120.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.121.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.121.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.121.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.121.gate_proj.weight_scale": 
"model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.121.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.121.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.122.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.122.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.122.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.122.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.122.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.122.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.123.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.123.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.123.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.123.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.123.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.123.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.124.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.124.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.124.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.124.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.124.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.124.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.125.down_proj.weight": "model-00069-of-00092.safetensors", + 
"model.layers.68.mlp.experts.125.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.125.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.125.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.125.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.125.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.126.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.126.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.126.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.126.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.126.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.126.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.127.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.127.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.127.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.127.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.127.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.127.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.128.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.128.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.128.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.128.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.128.up_proj.weight": 
"model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.128.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.129.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.129.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.129.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.129.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.129.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.129.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.13.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.13.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.13.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.13.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.13.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.13.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.130.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.130.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.130.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.130.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.130.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.130.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.131.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.131.down_proj.weight_scale": "model-00069-of-00092.safetensors", + 
"model.layers.68.mlp.experts.131.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.131.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.131.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.131.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.132.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.132.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.132.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.132.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.132.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.132.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.133.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.133.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.133.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.133.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.133.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.133.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.134.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.134.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.134.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.134.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.134.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.134.up_proj.weight_scale": 
"model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.135.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.135.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.135.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.135.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.135.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.135.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.136.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.136.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.136.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.136.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.136.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.136.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.137.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.137.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.137.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.137.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.137.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.137.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.138.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.138.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.138.gate_proj.weight": "model-00069-of-00092.safetensors", + 
"model.layers.68.mlp.experts.138.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.138.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.138.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.139.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.139.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.139.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.139.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.139.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.139.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.14.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.14.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.14.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.14.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.14.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.14.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.140.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.140.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.140.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.140.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.140.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.140.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.141.down_proj.weight": 
"model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.141.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.141.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.141.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.141.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.141.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.142.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.142.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.142.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.142.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.142.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.142.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.143.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.143.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.143.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.143.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.143.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.143.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.144.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.144.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.144.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.144.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + 
"model.layers.68.mlp.experts.144.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.144.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.145.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.145.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.145.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.145.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.145.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.145.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.146.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.146.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.146.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.146.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.146.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.146.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.147.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.147.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.147.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.147.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.147.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.147.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.148.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.148.down_proj.weight_scale": 
"model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.148.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.148.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.148.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.148.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.149.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.149.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.149.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.149.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.149.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.149.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.15.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.15.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.15.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.15.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.15.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.15.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.150.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.150.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.150.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.150.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.150.up_proj.weight": "model-00069-of-00092.safetensors", + 
"model.layers.68.mlp.experts.150.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.151.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.151.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.151.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.151.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.151.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.151.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.152.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.152.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.152.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.152.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.152.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.152.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.153.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.153.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.153.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.153.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.153.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.153.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.154.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.154.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.154.gate_proj.weight": 
"model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.154.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.154.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.154.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.155.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.155.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.155.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.155.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.155.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.155.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.156.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.156.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.156.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.156.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.156.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.156.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.157.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.157.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.157.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.157.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.157.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.157.up_proj.weight_scale": "model-00069-of-00092.safetensors", + 
"model.layers.68.mlp.experts.158.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.158.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.158.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.158.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.158.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.158.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.159.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.159.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.159.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.159.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.159.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.159.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.16.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.16.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.16.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.16.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.16.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.16.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.17.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.17.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.17.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.17.gate_proj.weight_scale": 
"model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.17.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.17.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.18.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.18.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.18.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.18.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.18.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.18.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.19.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.19.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.19.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.19.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.19.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.19.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.2.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.2.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.2.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.2.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.2.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.2.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.20.down_proj.weight": "model-00069-of-00092.safetensors", + 
"model.layers.68.mlp.experts.20.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.20.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.20.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.20.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.20.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.21.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.21.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.21.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.21.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.21.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.21.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.22.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.22.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.22.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.22.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.22.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.22.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.23.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.23.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.23.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.23.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.23.up_proj.weight": 
"model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.23.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.24.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.24.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.24.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.24.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.24.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.24.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.25.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.25.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.25.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.25.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.25.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.25.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.26.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.26.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.26.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.26.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.26.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.26.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.27.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.27.down_proj.weight_scale": "model-00069-of-00092.safetensors", + 
"model.layers.68.mlp.experts.27.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.27.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.27.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.27.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.28.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.28.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.28.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.28.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.28.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.28.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.29.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.29.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.29.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.29.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.29.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.29.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.3.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.3.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.3.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.3.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.3.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.3.up_proj.weight_scale": "model-00069-of-00092.safetensors", 
+ "model.layers.68.mlp.experts.30.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.30.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.30.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.30.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.30.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.30.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.31.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.31.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.31.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.31.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.31.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.31.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.32.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.32.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.32.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.32.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.32.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.32.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.33.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.33.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.33.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.33.gate_proj.weight_scale": 
"model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.33.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.33.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.34.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.34.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.34.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.34.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.34.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.34.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.35.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.35.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.35.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.35.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.35.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.35.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.36.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.36.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.36.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.36.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.36.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.36.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.37.down_proj.weight": "model-00069-of-00092.safetensors", + 
"model.layers.68.mlp.experts.37.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.37.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.37.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.37.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.37.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.38.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.38.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.38.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.38.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.38.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.38.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.39.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.39.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.39.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.39.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.39.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.39.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.4.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.4.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.4.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.4.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.4.up_proj.weight": 
"model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.4.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.40.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.40.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.40.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.40.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.40.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.40.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.41.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.41.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.41.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.41.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.41.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.41.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.42.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.42.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.42.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.42.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.42.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.42.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.43.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.43.down_proj.weight_scale": "model-00069-of-00092.safetensors", + 
"model.layers.68.mlp.experts.43.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.43.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.43.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.43.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.44.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.44.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.44.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.44.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.44.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.44.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.45.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.45.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.45.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.45.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.45.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.45.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.46.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.46.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.46.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.46.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.46.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.46.up_proj.weight_scale": 
"model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.47.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.47.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.47.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.47.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.47.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.47.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.48.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.48.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.48.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.48.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.48.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.48.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.49.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.49.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.49.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.49.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.49.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.49.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.5.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.5.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.5.gate_proj.weight": "model-00069-of-00092.safetensors", + 
"model.layers.68.mlp.experts.5.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.5.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.5.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.50.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.50.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.50.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.50.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.50.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.50.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.51.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.51.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.51.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.51.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.51.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.51.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.52.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.52.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.52.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.52.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.52.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.52.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.53.down_proj.weight": 
"model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.53.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.53.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.53.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.53.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.53.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.54.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.54.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.54.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.54.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.54.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.54.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.55.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.55.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.55.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.55.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.55.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.55.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.56.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.56.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.56.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.56.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + 
"model.layers.68.mlp.experts.56.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.56.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.57.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.57.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.57.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.57.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.57.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.57.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.58.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.58.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.58.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.58.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.58.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.58.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.59.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.59.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.59.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.59.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.59.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.59.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.6.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.6.down_proj.weight_scale": 
"model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.6.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.6.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.6.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.6.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.60.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.60.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.60.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.60.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.60.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.60.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.61.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.61.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.61.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.61.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.61.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.61.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.62.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.62.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.62.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.62.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.62.up_proj.weight": "model-00069-of-00092.safetensors", + 
"model.layers.68.mlp.experts.62.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.63.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.63.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.63.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.63.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.63.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.63.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.64.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.64.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.64.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.64.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.64.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.64.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.65.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.65.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.65.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.65.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.65.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.65.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.66.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.66.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.66.gate_proj.weight": 
"model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.66.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.66.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.66.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.67.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.67.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.67.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.67.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.67.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.67.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.68.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.68.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.68.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.68.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.68.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.68.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.69.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.69.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.69.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.69.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.69.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.69.up_proj.weight_scale": "model-00069-of-00092.safetensors", + 
"model.layers.68.mlp.experts.7.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.7.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.7.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.7.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.7.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.7.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.70.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.70.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.70.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.70.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.70.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.70.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.71.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.71.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.71.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.71.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.71.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.71.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.72.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.72.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.72.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.72.gate_proj.weight_scale": 
"model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.72.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.72.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.73.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.73.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.73.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.73.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.73.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.73.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.74.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.74.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.74.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.74.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.74.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.74.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.75.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.75.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.75.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.75.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.75.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.75.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.76.down_proj.weight": "model-00069-of-00092.safetensors", + 
"model.layers.68.mlp.experts.76.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.76.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.76.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.76.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.76.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.77.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.77.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.77.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.77.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.77.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.77.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.78.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.78.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.78.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.78.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.78.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.78.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.79.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.79.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.79.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.79.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.79.up_proj.weight": 
"model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.79.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.8.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.8.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.8.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.8.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.8.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.8.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.80.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.80.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.80.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.80.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.80.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.80.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.81.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.81.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.81.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.81.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.81.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.81.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.82.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.82.down_proj.weight_scale": "model-00069-of-00092.safetensors", + 
"model.layers.68.mlp.experts.82.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.82.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.82.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.82.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.83.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.83.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.83.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.83.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.83.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.83.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.84.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.84.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.84.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.84.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.84.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.84.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.85.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.85.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.85.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.85.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.85.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.85.up_proj.weight_scale": 
"model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.86.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.86.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.86.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.86.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.86.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.86.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.87.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.87.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.87.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.87.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.87.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.87.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.88.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.88.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.88.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.88.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.88.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.88.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.89.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.89.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.89.gate_proj.weight": "model-00069-of-00092.safetensors", + 
"model.layers.68.mlp.experts.89.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.89.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.89.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.9.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.9.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.9.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.9.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.9.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.9.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.90.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.90.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.90.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.90.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.90.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.90.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.91.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.91.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.91.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.91.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.91.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.91.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.92.down_proj.weight": "model-00069-of-00092.safetensors", 
+ "model.layers.68.mlp.experts.92.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.92.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.92.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.92.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.92.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.93.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.93.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.93.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.93.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.93.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.93.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.94.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.94.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.94.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.94.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.94.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.94.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.95.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.95.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.95.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.95.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.95.up_proj.weight": 
"model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.95.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.96.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.96.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.96.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.96.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.96.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.96.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.97.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.97.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.97.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.97.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.97.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.97.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.98.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.98.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.98.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.98.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.98.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.98.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.99.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.99.down_proj.weight_scale": "model-00069-of-00092.safetensors", + 
"model.layers.68.mlp.experts.99.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.99.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.99.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.experts.99.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.gate.e_score_correction_bias": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.gate.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.shared_experts.down_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.shared_experts.down_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.shared_experts.gate_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.shared_experts.gate_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.shared_experts.up_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.mlp.shared_experts.up_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.post_attention_layernorm.weight": "model-00069-of-00092.safetensors", + "model.layers.68.self_attn.k_norm.weight": "model-00069-of-00092.safetensors", + "model.layers.68.self_attn.k_proj.bias": "model-00069-of-00092.safetensors", + "model.layers.68.self_attn.k_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.self_attn.k_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.self_attn.o_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.self_attn.o_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.68.self_attn.q_norm.weight": "model-00069-of-00092.safetensors", + "model.layers.68.self_attn.q_proj.bias": "model-00069-of-00092.safetensors", + "model.layers.68.self_attn.q_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.self_attn.q_proj.weight_scale": 
"model-00069-of-00092.safetensors", + "model.layers.68.self_attn.v_proj.bias": "model-00069-of-00092.safetensors", + "model.layers.68.self_attn.v_proj.weight": "model-00069-of-00092.safetensors", + "model.layers.68.self_attn.v_proj.weight_scale": "model-00069-of-00092.safetensors", + "model.layers.69.input_layernorm.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.0.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.0.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.0.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.0.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.0.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.0.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.1.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.1.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.1.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.1.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.1.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.1.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.10.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.10.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.10.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.10.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.10.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.10.up_proj.weight_scale": "model-00070-of-00092.safetensors", + 
"model.layers.69.mlp.experts.100.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.100.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.100.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.100.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.100.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.100.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.101.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.101.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.101.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.101.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.101.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.101.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.102.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.102.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.102.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.102.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.102.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.102.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.103.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.103.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.103.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.103.gate_proj.weight_scale": 
"model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.103.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.103.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.104.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.104.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.104.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.104.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.104.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.104.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.105.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.105.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.105.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.105.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.105.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.105.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.106.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.106.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.106.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.106.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.106.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.106.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.107.down_proj.weight": "model-00070-of-00092.safetensors", + 
"model.layers.69.mlp.experts.107.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.107.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.107.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.107.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.107.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.108.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.108.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.108.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.108.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.108.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.108.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.109.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.109.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.109.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.109.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.109.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.109.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.11.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.11.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.11.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.11.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.11.up_proj.weight": 
"model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.11.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.110.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.110.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.110.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.110.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.110.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.110.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.111.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.111.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.111.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.111.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.111.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.111.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.112.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.112.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.112.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.112.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.112.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.112.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.113.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.113.down_proj.weight_scale": "model-00070-of-00092.safetensors", + 
"model.layers.69.mlp.experts.113.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.113.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.113.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.113.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.114.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.114.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.114.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.114.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.114.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.114.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.115.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.115.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.115.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.115.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.115.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.115.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.116.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.116.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.116.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.116.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.116.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.116.up_proj.weight_scale": 
"model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.117.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.117.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.117.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.117.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.117.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.117.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.118.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.118.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.118.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.118.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.118.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.118.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.119.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.119.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.119.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.119.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.119.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.119.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.12.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.12.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.12.gate_proj.weight": "model-00070-of-00092.safetensors", + 
"model.layers.69.mlp.experts.12.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.12.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.12.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.120.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.120.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.120.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.120.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.120.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.120.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.121.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.121.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.121.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.121.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.121.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.121.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.122.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.122.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.122.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.122.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.122.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.122.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.123.down_proj.weight": 
"model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.123.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.123.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.123.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.123.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.123.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.124.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.124.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.124.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.124.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.124.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.124.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.125.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.125.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.125.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.125.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.125.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.125.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.126.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.126.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.126.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.126.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + 
"model.layers.69.mlp.experts.126.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.126.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.127.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.127.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.127.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.127.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.127.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.127.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.128.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.128.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.128.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.128.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.128.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.128.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.129.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.129.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.129.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.129.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.129.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.129.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.13.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.13.down_proj.weight_scale": 
"model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.13.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.13.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.13.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.13.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.130.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.130.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.130.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.130.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.130.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.130.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.131.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.131.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.131.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.131.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.131.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.131.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.132.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.132.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.132.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.132.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.132.up_proj.weight": "model-00070-of-00092.safetensors", + 
"model.layers.69.mlp.experts.132.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.133.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.133.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.133.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.133.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.133.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.133.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.134.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.134.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.134.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.134.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.134.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.134.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.135.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.135.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.135.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.135.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.135.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.135.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.136.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.136.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.136.gate_proj.weight": 
"model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.136.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.136.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.136.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.137.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.137.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.137.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.137.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.137.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.137.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.138.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.138.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.138.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.138.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.138.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.138.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.139.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.139.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.139.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.139.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.139.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.139.up_proj.weight_scale": "model-00070-of-00092.safetensors", + 
"model.layers.69.mlp.experts.14.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.14.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.14.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.14.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.14.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.14.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.140.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.140.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.140.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.140.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.140.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.140.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.141.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.141.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.141.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.141.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.141.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.141.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.142.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.142.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.142.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.142.gate_proj.weight_scale": 
"model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.142.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.142.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.143.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.143.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.143.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.143.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.143.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.143.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.144.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.144.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.144.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.144.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.144.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.144.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.145.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.145.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.145.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.145.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.145.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.145.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.146.down_proj.weight": "model-00070-of-00092.safetensors", + 
"model.layers.69.mlp.experts.146.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.146.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.146.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.146.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.146.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.147.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.147.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.147.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.147.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.147.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.147.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.148.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.148.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.148.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.148.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.148.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.148.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.149.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.149.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.149.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.149.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.149.up_proj.weight": 
"model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.149.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.15.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.15.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.15.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.15.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.15.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.15.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.150.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.150.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.150.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.150.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.150.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.150.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.151.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.151.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.151.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.151.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.151.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.151.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.152.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.152.down_proj.weight_scale": "model-00070-of-00092.safetensors", + 
"model.layers.69.mlp.experts.152.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.152.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.152.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.152.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.153.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.153.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.153.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.153.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.153.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.153.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.154.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.154.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.154.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.154.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.154.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.154.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.155.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.155.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.155.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.155.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.155.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.155.up_proj.weight_scale": 
"model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.156.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.156.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.156.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.156.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.156.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.156.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.157.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.157.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.157.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.157.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.157.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.157.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.158.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.158.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.158.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.158.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.158.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.158.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.159.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.159.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.159.gate_proj.weight": "model-00070-of-00092.safetensors", + 
"model.layers.69.mlp.experts.159.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.159.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.159.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.16.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.16.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.16.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.16.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.16.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.16.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.17.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.17.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.17.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.17.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.17.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.17.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.18.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.18.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.18.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.18.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.18.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.18.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.19.down_proj.weight": 
"model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.19.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.19.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.19.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.19.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.19.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.2.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.2.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.2.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.2.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.2.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.2.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.20.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.20.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.20.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.20.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.20.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.20.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.21.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.21.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.21.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.21.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + 
"model.layers.69.mlp.experts.21.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.21.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.22.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.22.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.22.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.22.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.22.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.22.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.23.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.23.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.23.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.23.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.23.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.23.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.24.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.24.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.24.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.24.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.24.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.24.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.25.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.25.down_proj.weight_scale": 
"model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.25.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.25.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.25.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.25.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.26.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.26.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.26.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.26.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.26.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.26.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.27.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.27.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.27.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.27.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.27.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.27.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.28.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.28.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.28.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.28.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.28.up_proj.weight": "model-00070-of-00092.safetensors", + 
"model.layers.69.mlp.experts.28.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.29.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.29.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.29.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.29.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.29.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.29.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.3.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.3.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.3.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.3.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.3.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.3.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.30.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.30.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.30.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.30.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.30.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.30.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.31.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.31.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.31.gate_proj.weight": 
"model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.31.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.31.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.31.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.32.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.32.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.32.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.32.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.32.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.32.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.33.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.33.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.33.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.33.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.33.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.33.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.34.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.34.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.34.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.34.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.34.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.34.up_proj.weight_scale": "model-00070-of-00092.safetensors", + 
"model.layers.69.mlp.experts.35.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.35.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.35.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.35.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.35.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.35.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.36.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.36.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.36.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.36.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.36.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.36.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.37.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.37.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.37.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.37.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.37.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.37.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.38.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.38.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.38.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.38.gate_proj.weight_scale": 
"model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.38.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.38.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.39.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.39.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.39.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.39.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.39.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.39.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.4.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.4.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.4.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.4.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.4.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.4.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.40.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.40.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.40.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.40.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.40.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.40.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.41.down_proj.weight": "model-00070-of-00092.safetensors", + 
"model.layers.69.mlp.experts.41.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.41.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.41.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.41.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.41.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.42.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.42.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.42.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.42.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.42.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.42.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.43.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.43.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.43.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.43.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.43.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.43.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.44.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.44.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.44.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.44.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.44.up_proj.weight": 
"model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.44.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.45.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.45.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.45.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.45.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.45.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.45.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.46.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.46.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.46.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.46.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.46.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.46.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.47.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.47.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.47.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.47.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.47.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.47.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.48.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.48.down_proj.weight_scale": "model-00070-of-00092.safetensors", + 
"model.layers.69.mlp.experts.48.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.48.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.48.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.48.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.49.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.49.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.49.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.49.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.49.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.49.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.5.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.5.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.5.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.5.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.5.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.5.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.50.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.50.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.50.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.50.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.50.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.50.up_proj.weight_scale": "model-00070-of-00092.safetensors", 
+ "model.layers.69.mlp.experts.51.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.51.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.51.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.51.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.51.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.51.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.52.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.52.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.52.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.52.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.52.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.52.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.53.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.53.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.53.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.53.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.53.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.53.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.54.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.54.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.54.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.54.gate_proj.weight_scale": 
"model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.54.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.54.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.55.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.55.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.55.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.55.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.55.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.55.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.56.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.56.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.56.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.56.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.56.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.56.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.57.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.57.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.57.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.57.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.57.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.57.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.58.down_proj.weight": "model-00070-of-00092.safetensors", + 
"model.layers.69.mlp.experts.58.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.58.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.58.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.58.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.58.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.59.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.59.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.59.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.59.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.59.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.59.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.6.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.6.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.6.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.6.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.6.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.6.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.60.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.60.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.60.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.60.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.60.up_proj.weight": 
"model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.60.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.61.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.61.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.61.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.61.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.61.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.61.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.62.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.62.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.62.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.62.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.62.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.62.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.63.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.63.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.63.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.63.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.63.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.63.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.64.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.64.down_proj.weight_scale": "model-00070-of-00092.safetensors", + 
"model.layers.69.mlp.experts.64.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.64.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.64.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.64.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.65.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.65.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.65.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.65.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.65.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.65.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.66.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.66.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.66.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.66.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.66.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.66.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.67.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.67.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.67.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.67.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.67.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.67.up_proj.weight_scale": 
"model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.68.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.68.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.68.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.68.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.68.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.68.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.69.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.69.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.69.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.69.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.69.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.69.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.7.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.7.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.7.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.7.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.7.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.7.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.70.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.70.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.70.gate_proj.weight": "model-00070-of-00092.safetensors", + 
"model.layers.69.mlp.experts.70.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.70.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.70.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.71.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.71.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.71.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.71.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.71.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.71.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.72.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.72.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.72.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.72.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.72.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.72.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.73.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.73.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.73.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.73.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.73.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.73.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.74.down_proj.weight": 
"model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.74.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.74.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.74.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.74.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.74.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.75.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.75.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.75.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.75.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.75.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.75.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.76.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.76.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.76.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.76.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.76.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.76.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.77.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.77.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.77.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.77.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + 
"model.layers.69.mlp.experts.77.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.77.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.78.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.78.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.78.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.78.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.78.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.78.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.79.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.79.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.79.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.79.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.79.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.79.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.8.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.8.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.8.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.8.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.8.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.8.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.80.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.80.down_proj.weight_scale": "model-00070-of-00092.safetensors", 
+ "model.layers.69.mlp.experts.80.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.80.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.80.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.80.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.81.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.81.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.81.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.81.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.81.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.81.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.82.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.82.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.82.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.82.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.82.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.82.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.83.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.83.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.83.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.83.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.83.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.83.up_proj.weight_scale": 
"model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.84.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.84.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.84.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.84.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.84.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.84.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.85.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.85.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.85.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.85.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.85.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.85.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.86.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.86.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.86.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.86.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.86.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.86.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.87.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.87.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.87.gate_proj.weight": "model-00070-of-00092.safetensors", + 
"model.layers.69.mlp.experts.87.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.87.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.87.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.88.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.88.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.88.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.88.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.88.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.88.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.89.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.89.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.89.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.89.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.89.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.89.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.9.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.9.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.9.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.9.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.9.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.9.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.90.down_proj.weight": "model-00070-of-00092.safetensors", 
+ "model.layers.69.mlp.experts.90.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.90.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.90.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.90.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.90.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.91.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.91.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.91.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.91.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.91.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.91.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.92.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.92.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.92.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.92.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.92.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.92.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.93.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.93.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.93.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.93.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.93.up_proj.weight": 
"model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.93.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.94.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.94.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.94.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.94.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.94.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.94.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.95.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.95.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.95.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.95.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.95.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.95.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.96.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.96.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.96.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.96.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.96.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.96.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.97.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.97.down_proj.weight_scale": "model-00070-of-00092.safetensors", + 
"model.layers.69.mlp.experts.97.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.97.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.97.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.97.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.98.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.98.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.98.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.98.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.98.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.98.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.99.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.99.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.99.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.99.gate_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.99.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.experts.99.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.gate.e_score_correction_bias": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.gate.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.shared_experts.down_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.shared_experts.down_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.shared_experts.gate_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.shared_experts.gate_proj.weight_scale": 
"model-00070-of-00092.safetensors", + "model.layers.69.mlp.shared_experts.up_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.mlp.shared_experts.up_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.post_attention_layernorm.weight": "model-00070-of-00092.safetensors", + "model.layers.69.self_attn.k_norm.weight": "model-00070-of-00092.safetensors", + "model.layers.69.self_attn.k_proj.bias": "model-00070-of-00092.safetensors", + "model.layers.69.self_attn.k_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.self_attn.k_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.self_attn.o_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.self_attn.o_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.self_attn.q_norm.weight": "model-00070-of-00092.safetensors", + "model.layers.69.self_attn.q_proj.bias": "model-00070-of-00092.safetensors", + "model.layers.69.self_attn.q_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.self_attn.q_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.69.self_attn.v_proj.bias": "model-00070-of-00092.safetensors", + "model.layers.69.self_attn.v_proj.weight": "model-00070-of-00092.safetensors", + "model.layers.69.self_attn.v_proj.weight_scale": "model-00070-of-00092.safetensors", + "model.layers.70.input_layernorm.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.0.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.0.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.0.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.0.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.0.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.0.up_proj.weight_scale": 
"model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.1.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.1.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.1.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.1.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.1.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.1.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.10.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.10.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.10.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.10.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.10.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.10.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.100.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.100.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.100.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.100.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.100.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.100.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.101.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.101.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.101.gate_proj.weight": "model-00071-of-00092.safetensors", + 
"model.layers.70.mlp.experts.101.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.101.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.101.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.102.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.102.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.102.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.102.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.102.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.102.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.103.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.103.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.103.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.103.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.103.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.103.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.104.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.104.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.104.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.104.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.104.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.104.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.105.down_proj.weight": 
"model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.105.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.105.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.105.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.105.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.105.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.106.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.106.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.106.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.106.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.106.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.106.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.107.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.107.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.107.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.107.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.107.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.107.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.108.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.108.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.108.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.108.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + 
"model.layers.70.mlp.experts.108.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.108.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.109.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.109.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.109.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.109.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.109.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.109.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.11.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.11.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.11.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.11.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.11.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.11.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.110.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.110.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.110.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.110.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.110.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.110.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.111.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.111.down_proj.weight_scale": 
"model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.111.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.111.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.111.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.111.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.112.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.112.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.112.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.112.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.112.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.112.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.113.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.113.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.113.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.113.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.113.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.113.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.114.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.114.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.114.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.114.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.114.up_proj.weight": "model-00071-of-00092.safetensors", + 
"model.layers.70.mlp.experts.114.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.115.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.115.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.115.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.115.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.115.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.115.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.116.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.116.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.116.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.116.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.116.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.116.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.117.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.117.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.117.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.117.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.117.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.117.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.118.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.118.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.118.gate_proj.weight": 
"model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.118.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.118.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.118.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.119.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.119.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.119.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.119.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.119.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.119.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.12.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.12.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.12.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.12.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.12.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.12.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.120.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.120.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.120.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.120.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.120.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.120.up_proj.weight_scale": "model-00071-of-00092.safetensors", + 
"model.layers.70.mlp.experts.121.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.121.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.121.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.121.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.121.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.121.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.122.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.122.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.122.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.122.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.122.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.122.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.123.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.123.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.123.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.123.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.123.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.123.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.124.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.124.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.124.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.124.gate_proj.weight_scale": 
"model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.124.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.124.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.125.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.125.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.125.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.125.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.125.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.125.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.126.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.126.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.126.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.126.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.126.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.126.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.127.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.127.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.127.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.127.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.127.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.127.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.128.down_proj.weight": "model-00071-of-00092.safetensors", + 
"model.layers.70.mlp.experts.128.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.128.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.128.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.128.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.128.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.129.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.129.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.129.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.129.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.129.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.129.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.13.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.13.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.13.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.13.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.13.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.13.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.130.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.130.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.130.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.130.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.130.up_proj.weight": 
"model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.130.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.131.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.131.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.131.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.131.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.131.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.131.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.132.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.132.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.132.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.132.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.132.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.132.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.133.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.133.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.133.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.133.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.133.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.133.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.134.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.134.down_proj.weight_scale": "model-00071-of-00092.safetensors", + 
"model.layers.70.mlp.experts.134.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.134.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.134.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.134.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.135.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.135.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.135.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.135.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.135.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.135.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.136.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.136.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.136.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.136.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.136.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.136.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.137.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.137.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.137.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.137.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.137.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.137.up_proj.weight_scale": 
"model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.138.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.138.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.138.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.138.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.138.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.138.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.139.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.139.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.139.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.139.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.139.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.139.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.14.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.14.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.14.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.14.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.14.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.14.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.140.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.140.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.140.gate_proj.weight": "model-00071-of-00092.safetensors", + 
"model.layers.70.mlp.experts.140.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.140.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.140.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.141.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.141.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.141.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.141.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.141.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.141.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.142.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.142.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.142.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.142.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.142.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.142.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.143.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.143.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.143.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.143.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.143.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.143.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.144.down_proj.weight": 
"model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.144.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.144.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.144.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.144.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.144.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.145.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.145.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.145.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.145.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.145.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.145.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.146.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.146.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.146.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.146.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.146.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.146.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.147.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.147.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.147.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.147.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + 
"model.layers.70.mlp.experts.147.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.147.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.148.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.148.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.148.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.148.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.148.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.148.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.149.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.149.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.149.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.149.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.149.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.149.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.15.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.15.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.15.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.15.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.15.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.15.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.150.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.150.down_proj.weight_scale": 
"model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.150.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.150.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.150.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.150.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.151.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.151.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.151.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.151.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.151.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.151.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.152.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.152.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.152.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.152.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.152.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.152.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.153.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.153.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.153.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.153.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.153.up_proj.weight": "model-00071-of-00092.safetensors", + 
"model.layers.70.mlp.experts.153.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.154.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.154.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.154.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.154.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.154.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.154.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.155.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.155.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.155.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.155.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.155.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.155.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.156.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.156.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.156.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.156.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.156.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.156.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.157.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.157.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.157.gate_proj.weight": 
"model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.157.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.157.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.157.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.158.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.158.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.158.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.158.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.158.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.158.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.159.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.159.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.159.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.159.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.159.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.159.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.16.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.16.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.16.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.16.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.16.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.16.up_proj.weight_scale": "model-00071-of-00092.safetensors", + 
"model.layers.70.mlp.experts.17.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.17.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.17.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.17.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.17.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.17.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.18.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.18.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.18.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.18.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.18.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.18.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.19.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.19.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.19.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.19.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.19.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.19.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.2.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.2.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.2.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.2.gate_proj.weight_scale": 
"model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.2.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.2.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.20.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.20.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.20.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.20.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.20.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.20.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.21.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.21.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.21.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.21.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.21.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.21.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.22.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.22.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.22.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.22.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.22.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.22.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.23.down_proj.weight": "model-00071-of-00092.safetensors", + 
"model.layers.70.mlp.experts.23.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.23.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.23.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.23.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.23.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.24.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.24.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.24.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.24.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.24.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.24.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.25.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.25.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.25.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.25.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.25.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.25.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.26.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.26.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.26.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.26.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.26.up_proj.weight": 
"model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.26.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.27.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.27.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.27.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.27.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.27.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.27.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.28.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.28.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.28.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.28.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.28.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.28.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.29.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.29.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.29.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.29.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.29.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.29.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.3.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.3.down_proj.weight_scale": "model-00071-of-00092.safetensors", + 
"model.layers.70.mlp.experts.3.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.3.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.3.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.3.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.30.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.30.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.30.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.30.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.30.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.30.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.31.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.31.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.31.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.31.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.31.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.31.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.32.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.32.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.32.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.32.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.32.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.32.up_proj.weight_scale": 
"model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.33.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.33.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.33.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.33.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.33.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.33.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.34.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.34.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.34.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.34.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.34.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.34.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.35.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.35.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.35.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.35.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.35.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.35.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.36.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.36.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.36.gate_proj.weight": "model-00071-of-00092.safetensors", + 
"model.layers.70.mlp.experts.36.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.36.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.36.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.37.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.37.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.37.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.37.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.37.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.37.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.38.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.38.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.38.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.38.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.38.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.38.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.39.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.39.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.39.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.39.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.39.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.39.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.4.down_proj.weight": 
"model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.4.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.4.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.4.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.4.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.4.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.40.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.40.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.40.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.40.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.40.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.40.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.41.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.41.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.41.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.41.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.41.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.41.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.42.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.42.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.42.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.42.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + 
"model.layers.70.mlp.experts.42.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.42.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.43.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.43.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.43.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.43.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.43.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.43.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.44.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.44.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.44.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.44.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.44.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.44.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.45.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.45.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.45.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.45.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.45.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.45.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.46.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.46.down_proj.weight_scale": 
"model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.46.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.46.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.46.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.46.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.47.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.47.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.47.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.47.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.47.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.47.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.48.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.48.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.48.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.48.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.48.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.48.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.49.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.49.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.49.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.49.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.49.up_proj.weight": "model-00071-of-00092.safetensors", + 
"model.layers.70.mlp.experts.49.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.5.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.5.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.5.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.5.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.5.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.5.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.50.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.50.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.50.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.50.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.50.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.50.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.51.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.51.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.51.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.51.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.51.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.51.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.52.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.52.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.52.gate_proj.weight": 
"model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.52.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.52.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.52.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.53.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.53.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.53.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.53.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.53.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.53.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.54.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.54.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.54.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.54.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.54.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.54.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.55.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.55.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.55.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.55.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.55.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.55.up_proj.weight_scale": "model-00071-of-00092.safetensors", + 
"model.layers.70.mlp.experts.56.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.56.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.56.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.56.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.56.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.56.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.57.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.57.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.57.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.57.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.57.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.57.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.58.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.58.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.58.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.58.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.58.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.58.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.59.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.59.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.59.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.59.gate_proj.weight_scale": 
"model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.59.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.59.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.6.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.6.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.6.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.6.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.6.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.6.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.60.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.60.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.60.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.60.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.60.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.60.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.61.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.61.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.61.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.61.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.61.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.61.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.62.down_proj.weight": "model-00071-of-00092.safetensors", + 
"model.layers.70.mlp.experts.62.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.62.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.62.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.62.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.62.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.63.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.63.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.63.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.63.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.63.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.63.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.64.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.64.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.64.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.64.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.64.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.64.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.65.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.65.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.65.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.65.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.65.up_proj.weight": 
"model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.65.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.66.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.66.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.66.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.66.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.66.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.66.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.67.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.67.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.67.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.67.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.67.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.67.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.68.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.68.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.68.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.68.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.68.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.68.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.69.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.69.down_proj.weight_scale": "model-00071-of-00092.safetensors", + 
"model.layers.70.mlp.experts.69.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.69.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.69.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.69.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.7.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.7.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.7.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.7.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.7.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.7.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.70.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.70.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.70.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.70.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.70.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.70.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.71.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.71.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.71.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.71.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.71.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.71.up_proj.weight_scale": "model-00071-of-00092.safetensors", 
+ "model.layers.70.mlp.experts.72.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.72.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.72.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.72.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.72.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.72.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.73.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.73.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.73.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.73.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.73.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.73.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.74.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.74.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.74.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.74.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.74.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.74.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.75.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.75.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.75.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.75.gate_proj.weight_scale": 
"model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.75.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.75.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.76.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.76.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.76.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.76.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.76.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.76.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.77.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.77.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.77.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.77.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.77.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.77.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.78.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.78.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.78.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.78.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.78.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.78.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.79.down_proj.weight": "model-00071-of-00092.safetensors", + 
"model.layers.70.mlp.experts.79.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.79.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.79.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.79.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.79.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.8.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.8.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.8.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.8.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.8.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.8.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.80.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.80.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.80.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.80.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.80.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.80.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.81.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.81.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.81.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.81.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.81.up_proj.weight": 
"model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.81.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.82.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.82.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.82.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.82.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.82.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.82.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.83.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.83.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.83.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.83.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.83.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.83.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.84.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.84.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.84.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.84.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.84.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.84.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.85.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.85.down_proj.weight_scale": "model-00071-of-00092.safetensors", + 
"model.layers.70.mlp.experts.85.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.85.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.85.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.85.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.86.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.86.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.86.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.86.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.86.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.86.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.87.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.87.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.87.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.87.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.87.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.87.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.88.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.88.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.88.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.88.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.88.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.88.up_proj.weight_scale": 
"model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.89.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.89.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.89.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.89.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.89.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.89.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.9.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.9.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.9.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.9.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.9.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.9.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.90.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.90.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.90.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.90.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.90.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.90.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.91.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.91.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.91.gate_proj.weight": "model-00071-of-00092.safetensors", + 
"model.layers.70.mlp.experts.91.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.91.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.91.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.92.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.92.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.92.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.92.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.92.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.92.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.93.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.93.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.93.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.93.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.93.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.93.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.94.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.94.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.94.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.94.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.94.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.94.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.95.down_proj.weight": 
"model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.95.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.95.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.95.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.95.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.95.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.96.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.96.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.96.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.96.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.96.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.96.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.97.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.97.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.97.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.97.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.97.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.97.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.98.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.98.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.98.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.98.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + 
"model.layers.70.mlp.experts.98.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.98.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.99.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.99.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.99.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.99.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.99.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.experts.99.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.gate.e_score_correction_bias": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.gate.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.shared_experts.down_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.shared_experts.down_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.shared_experts.gate_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.shared_experts.gate_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.shared_experts.up_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.mlp.shared_experts.up_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.post_attention_layernorm.weight": "model-00071-of-00092.safetensors", + "model.layers.70.self_attn.k_norm.weight": "model-00071-of-00092.safetensors", + "model.layers.70.self_attn.k_proj.bias": "model-00071-of-00092.safetensors", + "model.layers.70.self_attn.k_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.self_attn.k_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.self_attn.o_proj.weight": "model-00071-of-00092.safetensors", + 
"model.layers.70.self_attn.o_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.self_attn.q_norm.weight": "model-00071-of-00092.safetensors", + "model.layers.70.self_attn.q_proj.bias": "model-00071-of-00092.safetensors", + "model.layers.70.self_attn.q_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.self_attn.q_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.70.self_attn.v_proj.bias": "model-00071-of-00092.safetensors", + "model.layers.70.self_attn.v_proj.weight": "model-00071-of-00092.safetensors", + "model.layers.70.self_attn.v_proj.weight_scale": "model-00071-of-00092.safetensors", + "model.layers.71.input_layernorm.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.0.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.0.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.0.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.0.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.0.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.0.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.1.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.1.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.1.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.1.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.1.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.1.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.10.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.10.down_proj.weight_scale": 
"model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.10.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.10.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.10.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.10.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.100.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.100.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.100.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.100.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.100.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.100.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.101.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.101.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.101.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.101.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.101.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.101.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.102.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.102.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.102.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.102.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.102.up_proj.weight": "model-00072-of-00092.safetensors", + 
"model.layers.71.mlp.experts.102.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.103.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.103.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.103.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.103.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.103.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.103.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.104.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.104.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.104.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.104.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.104.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.104.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.105.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.105.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.105.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.105.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.105.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.105.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.106.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.106.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.106.gate_proj.weight": 
"model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.106.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.106.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.106.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.107.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.107.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.107.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.107.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.107.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.107.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.108.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.108.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.108.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.108.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.108.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.108.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.109.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.109.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.109.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.109.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.109.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.109.up_proj.weight_scale": "model-00072-of-00092.safetensors", + 
"model.layers.71.mlp.experts.11.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.11.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.11.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.11.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.11.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.11.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.110.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.110.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.110.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.110.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.110.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.110.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.111.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.111.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.111.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.111.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.111.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.111.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.112.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.112.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.112.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.112.gate_proj.weight_scale": 
"model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.112.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.112.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.113.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.113.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.113.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.113.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.113.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.113.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.114.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.114.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.114.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.114.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.114.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.114.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.115.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.115.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.115.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.115.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.115.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.115.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.116.down_proj.weight": "model-00072-of-00092.safetensors", + 
"model.layers.71.mlp.experts.116.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.116.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.116.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.116.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.116.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.117.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.117.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.117.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.117.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.117.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.117.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.118.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.118.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.118.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.118.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.118.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.118.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.119.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.119.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.119.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.119.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.119.up_proj.weight": 
"model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.119.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.12.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.12.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.12.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.12.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.12.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.12.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.120.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.120.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.120.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.120.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.120.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.120.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.121.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.121.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.121.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.121.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.121.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.121.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.122.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.122.down_proj.weight_scale": "model-00072-of-00092.safetensors", + 
"model.layers.71.mlp.experts.122.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.122.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.122.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.122.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.123.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.123.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.123.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.123.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.123.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.123.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.124.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.124.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.124.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.124.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.124.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.124.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.125.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.125.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.125.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.125.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.125.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.125.up_proj.weight_scale": 
"model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.126.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.126.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.126.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.126.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.126.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.126.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.127.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.127.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.127.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.127.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.127.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.127.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.128.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.128.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.128.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.128.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.128.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.128.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.129.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.129.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.129.gate_proj.weight": "model-00072-of-00092.safetensors", + 
"model.layers.71.mlp.experts.129.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.129.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.129.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.13.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.13.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.13.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.13.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.13.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.13.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.130.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.130.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.130.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.130.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.130.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.130.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.131.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.131.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.131.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.131.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.131.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.131.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.132.down_proj.weight": 
"model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.132.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.132.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.132.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.132.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.132.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.133.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.133.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.133.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.133.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.133.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.133.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.134.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.134.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.134.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.134.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.134.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.134.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.135.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.135.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.135.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.135.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + 
"model.layers.71.mlp.experts.135.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.135.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.136.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.136.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.136.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.136.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.136.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.136.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.137.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.137.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.137.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.137.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.137.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.137.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.138.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.138.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.138.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.138.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.138.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.138.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.139.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.139.down_proj.weight_scale": 
"model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.139.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.139.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.139.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.139.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.14.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.14.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.14.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.14.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.14.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.14.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.140.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.140.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.140.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.140.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.140.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.140.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.141.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.141.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.141.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.141.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.141.up_proj.weight": "model-00072-of-00092.safetensors", + 
"model.layers.71.mlp.experts.141.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.142.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.142.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.142.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.142.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.142.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.142.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.143.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.143.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.143.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.143.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.143.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.143.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.144.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.144.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.144.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.144.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.144.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.144.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.145.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.145.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.145.gate_proj.weight": 
"model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.145.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.145.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.145.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.146.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.146.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.146.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.146.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.146.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.146.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.147.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.147.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.147.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.147.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.147.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.147.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.148.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.148.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.148.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.148.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.148.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.148.up_proj.weight_scale": "model-00072-of-00092.safetensors", + 
"model.layers.71.mlp.experts.149.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.149.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.149.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.149.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.149.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.149.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.15.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.15.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.15.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.15.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.15.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.15.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.150.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.150.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.150.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.150.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.150.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.150.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.151.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.151.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.151.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.151.gate_proj.weight_scale": 
"model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.151.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.151.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.152.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.152.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.152.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.152.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.152.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.152.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.153.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.153.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.153.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.153.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.153.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.153.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.154.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.154.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.154.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.154.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.154.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.154.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.155.down_proj.weight": "model-00072-of-00092.safetensors", + 
"model.layers.71.mlp.experts.155.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.155.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.155.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.155.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.155.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.156.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.156.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.156.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.156.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.156.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.156.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.157.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.157.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.157.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.157.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.157.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.157.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.158.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.158.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.158.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.158.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.158.up_proj.weight": 
"model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.158.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.159.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.159.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.159.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.159.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.159.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.159.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.16.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.16.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.16.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.16.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.16.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.16.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.17.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.17.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.17.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.17.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.17.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.17.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.18.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.18.down_proj.weight_scale": "model-00072-of-00092.safetensors", + 
"model.layers.71.mlp.experts.18.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.18.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.18.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.18.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.19.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.19.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.19.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.19.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.19.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.19.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.2.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.2.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.2.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.2.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.2.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.2.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.20.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.20.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.20.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.20.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.20.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.20.up_proj.weight_scale": "model-00072-of-00092.safetensors", 
+ "model.layers.71.mlp.experts.21.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.21.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.21.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.21.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.21.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.21.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.22.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.22.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.22.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.22.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.22.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.22.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.23.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.23.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.23.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.23.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.23.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.23.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.24.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.24.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.24.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.24.gate_proj.weight_scale": 
"model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.24.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.24.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.25.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.25.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.25.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.25.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.25.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.25.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.26.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.26.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.26.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.26.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.26.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.26.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.27.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.27.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.27.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.27.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.27.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.27.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.28.down_proj.weight": "model-00072-of-00092.safetensors", + 
"model.layers.71.mlp.experts.28.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.28.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.28.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.28.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.28.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.29.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.29.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.29.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.29.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.29.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.29.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.3.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.3.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.3.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.3.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.3.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.3.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.30.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.30.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.30.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.30.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.30.up_proj.weight": 
"model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.30.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.31.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.31.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.31.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.31.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.31.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.31.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.32.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.32.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.32.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.32.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.32.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.32.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.33.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.33.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.33.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.33.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.33.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.33.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.34.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.34.down_proj.weight_scale": "model-00072-of-00092.safetensors", + 
"model.layers.71.mlp.experts.34.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.34.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.34.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.34.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.35.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.35.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.35.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.35.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.35.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.35.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.36.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.36.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.36.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.36.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.36.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.36.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.37.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.37.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.37.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.37.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.37.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.37.up_proj.weight_scale": 
"model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.38.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.38.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.38.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.38.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.38.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.38.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.39.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.39.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.39.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.39.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.39.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.39.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.4.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.4.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.4.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.4.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.4.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.4.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.40.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.40.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.40.gate_proj.weight": "model-00072-of-00092.safetensors", + 
"model.layers.71.mlp.experts.40.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.40.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.40.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.41.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.41.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.41.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.41.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.41.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.41.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.42.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.42.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.42.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.42.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.42.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.42.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.43.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.43.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.43.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.43.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.43.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.43.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.44.down_proj.weight": 
"model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.44.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.44.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.44.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.44.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.44.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.45.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.45.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.45.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.45.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.45.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.45.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.46.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.46.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.46.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.46.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.46.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.46.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.47.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.47.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.47.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.47.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + 
"model.layers.71.mlp.experts.47.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.47.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.48.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.48.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.48.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.48.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.48.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.48.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.49.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.49.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.49.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.49.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.49.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.49.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.5.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.5.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.5.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.5.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.5.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.5.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.50.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.50.down_proj.weight_scale": "model-00072-of-00092.safetensors", 
+ "model.layers.71.mlp.experts.50.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.50.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.50.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.50.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.51.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.51.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.51.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.51.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.51.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.51.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.52.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.52.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.52.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.52.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.52.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.52.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.53.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.53.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.53.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.53.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.53.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.53.up_proj.weight_scale": 
"model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.54.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.54.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.54.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.54.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.54.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.54.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.55.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.55.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.55.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.55.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.55.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.55.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.56.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.56.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.56.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.56.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.56.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.56.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.57.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.57.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.57.gate_proj.weight": "model-00072-of-00092.safetensors", + 
"model.layers.71.mlp.experts.57.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.57.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.57.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.58.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.58.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.58.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.58.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.58.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.58.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.59.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.59.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.59.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.59.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.59.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.59.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.6.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.6.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.6.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.6.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.6.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.6.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.60.down_proj.weight": "model-00072-of-00092.safetensors", 
+ "model.layers.71.mlp.experts.60.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.60.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.60.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.60.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.60.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.61.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.61.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.61.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.61.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.61.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.61.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.62.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.62.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.62.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.62.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.62.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.62.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.63.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.63.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.63.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.63.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.63.up_proj.weight": 
"model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.63.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.64.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.64.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.64.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.64.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.64.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.64.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.65.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.65.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.65.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.65.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.65.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.65.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.66.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.66.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.66.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.66.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.66.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.66.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.67.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.67.down_proj.weight_scale": "model-00072-of-00092.safetensors", + 
"model.layers.71.mlp.experts.67.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.67.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.67.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.67.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.68.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.68.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.68.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.68.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.68.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.68.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.69.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.69.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.69.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.69.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.69.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.69.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.7.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.7.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.7.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.7.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.7.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.7.up_proj.weight_scale": "model-00072-of-00092.safetensors", 
+ "model.layers.71.mlp.experts.70.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.70.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.70.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.70.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.70.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.70.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.71.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.71.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.71.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.71.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.71.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.71.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.72.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.72.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.72.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.72.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.72.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.72.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.73.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.73.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.73.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.73.gate_proj.weight_scale": 
"model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.73.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.73.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.74.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.74.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.74.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.74.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.74.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.74.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.75.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.75.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.75.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.75.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.75.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.75.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.76.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.76.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.76.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.76.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.76.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.76.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.77.down_proj.weight": "model-00072-of-00092.safetensors", + 
"model.layers.71.mlp.experts.77.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.77.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.77.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.77.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.77.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.78.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.78.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.78.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.78.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.78.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.78.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.79.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.79.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.79.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.79.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.79.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.79.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.8.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.8.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.8.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.8.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.8.up_proj.weight": 
"model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.8.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.80.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.80.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.80.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.80.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.80.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.80.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.81.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.81.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.81.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.81.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.81.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.81.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.82.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.82.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.82.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.82.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.82.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.82.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.83.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.83.down_proj.weight_scale": "model-00072-of-00092.safetensors", + 
"model.layers.71.mlp.experts.83.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.83.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.83.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.83.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.84.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.84.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.84.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.84.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.84.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.84.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.85.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.85.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.85.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.85.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.85.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.85.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.86.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.86.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.86.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.86.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.86.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.86.up_proj.weight_scale": 
"model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.87.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.87.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.87.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.87.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.87.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.87.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.88.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.88.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.88.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.88.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.88.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.88.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.89.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.89.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.89.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.89.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.89.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.89.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.9.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.9.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.9.gate_proj.weight": "model-00072-of-00092.safetensors", + 
"model.layers.71.mlp.experts.9.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.9.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.9.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.90.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.90.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.90.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.90.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.90.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.90.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.91.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.91.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.91.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.91.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.91.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.91.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.92.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.92.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.92.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.92.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.92.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.92.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.93.down_proj.weight": 
"model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.93.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.93.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.93.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.93.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.93.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.94.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.94.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.94.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.94.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.94.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.94.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.95.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.95.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.95.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.95.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.95.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.95.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.96.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.96.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.96.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.96.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + 
"model.layers.71.mlp.experts.96.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.96.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.97.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.97.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.97.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.97.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.97.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.97.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.98.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.98.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.98.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.98.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.98.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.98.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.99.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.99.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.99.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.99.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.99.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.experts.99.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.gate.e_score_correction_bias": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.gate.weight": "model-00072-of-00092.safetensors", + 
"model.layers.71.mlp.shared_experts.down_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.shared_experts.down_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.shared_experts.gate_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.shared_experts.gate_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.shared_experts.up_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.mlp.shared_experts.up_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.post_attention_layernorm.weight": "model-00072-of-00092.safetensors", + "model.layers.71.self_attn.k_norm.weight": "model-00072-of-00092.safetensors", + "model.layers.71.self_attn.k_proj.bias": "model-00072-of-00092.safetensors", + "model.layers.71.self_attn.k_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.self_attn.k_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.self_attn.o_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.self_attn.o_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.self_attn.q_norm.weight": "model-00072-of-00092.safetensors", + "model.layers.71.self_attn.q_proj.bias": "model-00072-of-00092.safetensors", + "model.layers.71.self_attn.q_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.self_attn.q_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.71.self_attn.v_proj.bias": "model-00072-of-00092.safetensors", + "model.layers.71.self_attn.v_proj.weight": "model-00072-of-00092.safetensors", + "model.layers.71.self_attn.v_proj.weight_scale": "model-00072-of-00092.safetensors", + "model.layers.72.input_layernorm.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.0.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.0.down_proj.weight_scale": "model-00073-of-00092.safetensors", + 
"model.layers.72.mlp.experts.0.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.0.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.0.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.0.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.1.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.1.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.1.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.1.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.1.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.1.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.10.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.10.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.10.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.10.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.10.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.10.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.100.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.100.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.100.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.100.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.100.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.100.up_proj.weight_scale": 
"model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.101.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.101.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.101.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.101.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.101.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.101.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.102.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.102.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.102.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.102.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.102.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.102.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.103.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.103.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.103.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.103.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.103.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.103.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.104.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.104.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.104.gate_proj.weight": "model-00073-of-00092.safetensors", + 
"model.layers.72.mlp.experts.104.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.104.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.104.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.105.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.105.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.105.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.105.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.105.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.105.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.106.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.106.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.106.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.106.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.106.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.106.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.107.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.107.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.107.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.107.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.107.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.107.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.108.down_proj.weight": 
"model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.108.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.108.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.108.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.108.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.108.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.109.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.109.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.109.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.109.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.109.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.109.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.11.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.11.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.11.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.11.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.11.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.11.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.110.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.110.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.110.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.110.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + 
"model.layers.72.mlp.experts.110.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.110.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.111.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.111.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.111.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.111.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.111.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.111.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.112.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.112.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.112.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.112.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.112.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.112.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.113.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.113.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.113.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.113.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.113.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.113.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.114.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.114.down_proj.weight_scale": 
"model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.114.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.114.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.114.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.114.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.115.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.115.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.115.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.115.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.115.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.115.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.116.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.116.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.116.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.116.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.116.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.116.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.117.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.117.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.117.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.117.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.117.up_proj.weight": "model-00073-of-00092.safetensors", + 
"model.layers.72.mlp.experts.117.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.118.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.118.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.118.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.118.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.118.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.118.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.119.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.119.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.119.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.119.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.119.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.119.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.12.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.12.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.12.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.12.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.12.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.12.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.120.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.120.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.120.gate_proj.weight": 
"model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.120.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.120.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.120.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.121.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.121.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.121.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.121.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.121.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.121.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.122.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.122.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.122.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.122.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.122.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.122.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.123.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.123.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.123.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.123.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.123.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.123.up_proj.weight_scale": "model-00073-of-00092.safetensors", + 
"model.layers.72.mlp.experts.124.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.124.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.124.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.124.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.124.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.124.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.125.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.125.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.125.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.125.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.125.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.125.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.126.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.126.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.126.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.126.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.126.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.126.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.127.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.127.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.127.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.127.gate_proj.weight_scale": 
"model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.127.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.127.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.128.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.128.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.128.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.128.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.128.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.128.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.129.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.129.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.129.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.129.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.129.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.129.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.13.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.13.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.13.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.13.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.13.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.13.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.130.down_proj.weight": "model-00073-of-00092.safetensors", + 
"model.layers.72.mlp.experts.130.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.130.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.130.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.130.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.130.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.131.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.131.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.131.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.131.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.131.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.131.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.132.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.132.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.132.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.132.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.132.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.132.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.133.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.133.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.133.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.133.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.133.up_proj.weight": 
"model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.133.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.134.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.134.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.134.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.134.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.134.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.134.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.135.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.135.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.135.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.135.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.135.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.135.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.136.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.136.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.136.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.136.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.136.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.136.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.137.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.137.down_proj.weight_scale": "model-00073-of-00092.safetensors", + 
"model.layers.72.mlp.experts.137.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.137.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.137.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.137.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.138.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.138.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.138.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.138.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.138.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.138.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.139.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.139.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.139.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.139.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.139.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.139.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.14.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.14.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.14.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.14.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.14.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.14.up_proj.weight_scale": 
"model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.140.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.140.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.140.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.140.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.140.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.140.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.141.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.141.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.141.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.141.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.141.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.141.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.142.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.142.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.142.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.142.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.142.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.142.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.143.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.143.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.143.gate_proj.weight": "model-00073-of-00092.safetensors", + 
"model.layers.72.mlp.experts.143.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.143.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.143.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.144.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.144.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.144.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.144.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.144.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.144.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.145.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.145.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.145.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.145.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.145.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.145.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.146.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.146.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.146.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.146.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.146.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.146.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.147.down_proj.weight": 
"model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.147.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.147.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.147.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.147.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.147.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.148.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.148.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.148.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.148.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.148.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.148.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.149.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.149.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.149.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.149.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.149.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.149.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.15.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.15.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.15.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.15.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + 
"model.layers.72.mlp.experts.15.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.15.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.150.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.150.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.150.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.150.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.150.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.150.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.151.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.151.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.151.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.151.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.151.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.151.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.152.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.152.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.152.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.152.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.152.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.152.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.153.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.153.down_proj.weight_scale": 
"model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.153.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.153.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.153.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.153.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.154.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.154.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.154.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.154.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.154.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.154.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.155.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.155.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.155.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.155.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.155.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.155.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.156.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.156.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.156.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.156.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.156.up_proj.weight": "model-00073-of-00092.safetensors", + 
"model.layers.72.mlp.experts.156.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.157.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.157.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.157.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.157.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.157.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.157.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.158.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.158.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.158.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.158.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.158.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.158.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.159.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.159.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.159.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.159.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.159.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.159.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.16.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.16.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.16.gate_proj.weight": 
"model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.16.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.16.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.16.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.17.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.17.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.17.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.17.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.17.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.17.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.18.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.18.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.18.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.18.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.18.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.18.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.19.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.19.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.19.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.19.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.19.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.19.up_proj.weight_scale": "model-00073-of-00092.safetensors", + 
"model.layers.72.mlp.experts.2.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.2.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.2.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.2.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.2.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.2.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.20.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.20.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.20.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.20.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.20.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.20.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.21.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.21.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.21.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.21.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.21.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.21.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.22.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.22.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.22.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.22.gate_proj.weight_scale": 
"model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.22.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.22.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.23.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.23.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.23.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.23.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.23.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.23.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.24.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.24.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.24.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.24.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.24.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.24.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.25.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.25.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.25.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.25.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.25.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.25.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.26.down_proj.weight": "model-00073-of-00092.safetensors", + 
"model.layers.72.mlp.experts.26.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.26.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.26.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.26.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.26.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.27.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.27.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.27.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.27.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.27.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.27.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.28.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.28.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.28.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.28.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.28.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.28.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.29.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.29.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.29.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.29.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.29.up_proj.weight": 
"model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.29.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.3.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.3.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.3.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.3.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.3.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.3.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.30.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.30.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.30.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.30.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.30.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.30.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.31.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.31.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.31.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.31.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.31.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.31.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.32.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.32.down_proj.weight_scale": "model-00073-of-00092.safetensors", + 
"model.layers.72.mlp.experts.32.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.32.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.32.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.32.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.33.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.33.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.33.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.33.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.33.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.33.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.34.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.34.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.34.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.34.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.34.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.34.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.35.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.35.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.35.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.35.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.35.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.35.up_proj.weight_scale": 
"model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.36.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.36.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.36.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.36.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.36.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.36.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.37.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.37.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.37.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.37.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.37.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.37.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.38.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.38.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.38.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.38.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.38.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.38.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.39.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.39.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.39.gate_proj.weight": "model-00073-of-00092.safetensors", + 
"model.layers.72.mlp.experts.39.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.39.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.39.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.4.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.4.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.4.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.4.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.4.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.4.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.40.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.40.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.40.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.40.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.40.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.40.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.41.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.41.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.41.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.41.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.41.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.41.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.42.down_proj.weight": "model-00073-of-00092.safetensors", 
+ "model.layers.72.mlp.experts.42.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.42.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.42.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.42.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.42.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.43.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.43.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.43.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.43.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.43.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.43.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.44.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.44.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.44.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.44.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.44.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.44.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.45.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.45.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.45.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.45.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.45.up_proj.weight": 
"model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.45.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.46.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.46.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.46.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.46.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.46.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.46.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.47.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.47.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.47.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.47.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.47.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.47.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.48.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.48.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.48.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.48.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.48.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.48.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.49.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.49.down_proj.weight_scale": "model-00073-of-00092.safetensors", + 
"model.layers.72.mlp.experts.49.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.49.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.49.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.49.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.5.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.5.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.5.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.5.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.5.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.5.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.50.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.50.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.50.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.50.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.50.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.50.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.51.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.51.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.51.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.51.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.51.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.51.up_proj.weight_scale": "model-00073-of-00092.safetensors", 
+ "model.layers.72.mlp.experts.52.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.52.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.52.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.52.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.52.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.52.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.53.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.53.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.53.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.53.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.53.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.53.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.54.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.54.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.54.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.54.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.54.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.54.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.55.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.55.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.55.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.55.gate_proj.weight_scale": 
"model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.55.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.55.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.56.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.56.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.56.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.56.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.56.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.56.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.57.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.57.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.57.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.57.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.57.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.57.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.58.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.58.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.58.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.58.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.58.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.58.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.59.down_proj.weight": "model-00073-of-00092.safetensors", + 
"model.layers.72.mlp.experts.59.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.59.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.59.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.59.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.59.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.6.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.6.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.6.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.6.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.6.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.6.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.60.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.60.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.60.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.60.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.60.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.60.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.61.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.61.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.61.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.61.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.61.up_proj.weight": 
"model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.61.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.62.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.62.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.62.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.62.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.62.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.62.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.63.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.63.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.63.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.63.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.63.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.63.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.64.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.64.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.64.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.64.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.64.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.64.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.65.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.65.down_proj.weight_scale": "model-00073-of-00092.safetensors", + 
"model.layers.72.mlp.experts.65.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.65.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.65.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.65.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.66.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.66.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.66.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.66.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.66.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.66.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.67.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.67.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.67.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.67.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.67.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.67.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.68.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.68.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.68.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.68.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.68.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.68.up_proj.weight_scale": 
"model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.69.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.69.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.69.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.69.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.69.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.69.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.7.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.7.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.7.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.7.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.7.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.7.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.70.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.70.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.70.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.70.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.70.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.70.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.71.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.71.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.71.gate_proj.weight": "model-00073-of-00092.safetensors", + 
"model.layers.72.mlp.experts.71.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.71.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.71.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.72.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.72.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.72.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.72.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.72.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.72.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.73.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.73.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.73.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.73.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.73.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.73.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.74.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.74.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.74.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.74.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.74.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.74.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.75.down_proj.weight": 
"model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.75.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.75.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.75.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.75.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.75.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.76.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.76.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.76.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.76.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.76.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.76.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.77.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.77.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.77.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.77.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.77.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.77.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.78.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.78.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.78.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.78.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + 
"model.layers.72.mlp.experts.78.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.78.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.79.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.79.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.79.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.79.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.79.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.79.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.8.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.8.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.8.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.8.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.8.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.8.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.80.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.80.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.80.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.80.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.80.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.80.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.81.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.81.down_proj.weight_scale": "model-00073-of-00092.safetensors", 
+ "model.layers.72.mlp.experts.81.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.81.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.81.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.81.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.82.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.82.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.82.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.82.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.82.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.82.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.83.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.83.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.83.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.83.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.83.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.83.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.84.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.84.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.84.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.84.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.84.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.84.up_proj.weight_scale": 
"model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.85.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.85.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.85.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.85.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.85.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.85.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.86.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.86.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.86.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.86.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.86.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.86.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.87.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.87.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.87.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.87.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.87.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.87.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.88.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.88.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.88.gate_proj.weight": "model-00073-of-00092.safetensors", + 
"model.layers.72.mlp.experts.88.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.88.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.88.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.89.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.89.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.89.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.89.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.89.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.89.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.9.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.9.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.9.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.9.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.9.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.9.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.90.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.90.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.90.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.90.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.90.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.90.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.91.down_proj.weight": "model-00073-of-00092.safetensors", 
+ "model.layers.72.mlp.experts.91.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.91.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.91.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.91.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.91.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.92.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.92.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.92.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.92.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.92.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.92.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.93.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.93.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.93.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.93.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.93.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.93.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.94.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.94.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.94.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.94.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.94.up_proj.weight": 
"model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.94.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.95.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.95.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.95.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.95.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.95.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.95.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.96.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.96.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.96.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.96.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.96.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.96.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.97.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.97.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.97.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.97.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.97.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.97.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.98.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.98.down_proj.weight_scale": "model-00073-of-00092.safetensors", + 
"model.layers.72.mlp.experts.98.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.98.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.98.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.98.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.99.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.99.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.99.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.99.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.99.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.experts.99.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.gate.e_score_correction_bias": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.gate.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.shared_experts.down_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.shared_experts.down_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.shared_experts.gate_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.shared_experts.gate_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.shared_experts.up_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.mlp.shared_experts.up_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.post_attention_layernorm.weight": "model-00073-of-00092.safetensors", + "model.layers.72.self_attn.k_norm.weight": "model-00073-of-00092.safetensors", + "model.layers.72.self_attn.k_proj.bias": "model-00073-of-00092.safetensors", + "model.layers.72.self_attn.k_proj.weight": "model-00073-of-00092.safetensors", + 
"model.layers.72.self_attn.k_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.self_attn.o_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.self_attn.o_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.self_attn.q_norm.weight": "model-00073-of-00092.safetensors", + "model.layers.72.self_attn.q_proj.bias": "model-00073-of-00092.safetensors", + "model.layers.72.self_attn.q_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.self_attn.q_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.72.self_attn.v_proj.bias": "model-00073-of-00092.safetensors", + "model.layers.72.self_attn.v_proj.weight": "model-00073-of-00092.safetensors", + "model.layers.72.self_attn.v_proj.weight_scale": "model-00073-of-00092.safetensors", + "model.layers.73.input_layernorm.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.0.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.0.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.0.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.0.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.0.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.0.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.1.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.1.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.1.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.1.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.1.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.1.up_proj.weight_scale": "model-00074-of-00092.safetensors", + 
"model.layers.73.mlp.experts.10.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.10.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.10.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.10.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.10.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.10.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.100.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.100.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.100.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.100.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.100.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.100.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.101.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.101.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.101.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.101.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.101.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.101.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.102.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.102.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.102.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.102.gate_proj.weight_scale": 
"model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.102.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.102.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.103.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.103.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.103.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.103.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.103.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.103.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.104.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.104.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.104.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.104.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.104.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.104.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.105.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.105.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.105.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.105.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.105.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.105.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.106.down_proj.weight": "model-00074-of-00092.safetensors", + 
"model.layers.73.mlp.experts.106.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.106.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.106.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.106.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.106.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.107.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.107.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.107.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.107.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.107.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.107.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.108.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.108.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.108.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.108.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.108.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.108.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.109.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.109.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.109.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.109.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.109.up_proj.weight": 
"model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.109.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.11.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.11.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.11.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.11.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.11.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.11.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.110.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.110.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.110.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.110.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.110.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.110.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.111.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.111.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.111.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.111.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.111.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.111.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.112.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.112.down_proj.weight_scale": "model-00074-of-00092.safetensors", + 
"model.layers.73.mlp.experts.112.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.112.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.112.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.112.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.113.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.113.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.113.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.113.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.113.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.113.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.114.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.114.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.114.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.114.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.114.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.114.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.115.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.115.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.115.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.115.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.115.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.115.up_proj.weight_scale": 
"model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.116.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.116.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.116.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.116.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.116.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.116.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.117.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.117.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.117.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.117.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.117.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.117.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.118.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.118.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.118.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.118.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.118.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.118.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.119.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.119.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.119.gate_proj.weight": "model-00074-of-00092.safetensors", + 
"model.layers.73.mlp.experts.119.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.119.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.119.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.12.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.12.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.12.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.12.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.12.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.12.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.120.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.120.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.120.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.120.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.120.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.120.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.121.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.121.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.121.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.121.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.121.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.121.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.122.down_proj.weight": 
"model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.122.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.122.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.122.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.122.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.122.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.123.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.123.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.123.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.123.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.123.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.123.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.124.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.124.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.124.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.124.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.124.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.124.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.125.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.125.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.125.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.125.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + 
"model.layers.73.mlp.experts.125.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.125.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.126.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.126.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.126.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.126.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.126.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.126.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.127.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.127.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.127.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.127.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.127.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.127.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.128.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.128.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.128.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.128.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.128.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.128.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.129.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.129.down_proj.weight_scale": 
"model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.129.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.129.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.129.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.129.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.13.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.13.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.13.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.13.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.13.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.13.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.130.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.130.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.130.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.130.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.130.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.130.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.131.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.131.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.131.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.131.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.131.up_proj.weight": "model-00074-of-00092.safetensors", + 
"model.layers.73.mlp.experts.131.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.132.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.132.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.132.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.132.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.132.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.132.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.133.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.133.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.133.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.133.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.133.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.133.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.134.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.134.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.134.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.134.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.134.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.134.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.135.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.135.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.135.gate_proj.weight": 
"model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.135.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.135.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.135.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.136.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.136.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.136.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.136.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.136.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.136.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.137.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.137.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.137.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.137.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.137.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.137.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.138.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.138.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.138.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.138.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.138.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.138.up_proj.weight_scale": "model-00074-of-00092.safetensors", + 
"model.layers.73.mlp.experts.139.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.139.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.139.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.139.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.139.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.139.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.14.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.14.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.14.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.14.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.14.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.14.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.140.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.140.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.140.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.140.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.140.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.140.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.141.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.141.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.141.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.141.gate_proj.weight_scale": 
"model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.141.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.141.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.142.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.142.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.142.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.142.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.142.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.142.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.143.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.143.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.143.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.143.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.143.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.143.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.144.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.144.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.144.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.144.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.144.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.144.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.145.down_proj.weight": "model-00074-of-00092.safetensors", + 
"model.layers.73.mlp.experts.145.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.145.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.145.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.145.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.145.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.146.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.146.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.146.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.146.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.146.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.146.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.147.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.147.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.147.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.147.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.147.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.147.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.148.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.148.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.148.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.148.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.148.up_proj.weight": 
"model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.148.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.149.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.149.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.149.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.149.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.149.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.149.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.15.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.15.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.15.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.15.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.15.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.15.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.150.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.150.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.150.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.150.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.150.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.150.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.151.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.151.down_proj.weight_scale": "model-00074-of-00092.safetensors", + 
"model.layers.73.mlp.experts.151.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.151.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.151.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.151.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.152.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.152.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.152.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.152.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.152.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.152.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.153.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.153.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.153.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.153.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.153.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.153.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.154.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.154.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.154.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.154.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.154.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.154.up_proj.weight_scale": 
"model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.155.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.155.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.155.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.155.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.155.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.155.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.156.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.156.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.156.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.156.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.156.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.156.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.157.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.157.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.157.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.157.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.157.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.157.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.158.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.158.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.158.gate_proj.weight": "model-00074-of-00092.safetensors", + 
"model.layers.73.mlp.experts.158.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.158.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.158.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.159.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.159.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.159.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.159.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.159.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.159.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.16.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.16.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.16.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.16.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.16.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.16.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.17.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.17.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.17.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.17.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.17.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.17.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.18.down_proj.weight": 
"model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.18.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.18.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.18.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.18.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.18.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.19.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.19.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.19.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.19.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.19.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.19.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.2.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.2.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.2.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.2.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.2.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.2.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.20.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.20.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.20.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.20.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + 
"model.layers.73.mlp.experts.20.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.20.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.21.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.21.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.21.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.21.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.21.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.21.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.22.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.22.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.22.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.22.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.22.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.22.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.23.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.23.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.23.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.23.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.23.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.23.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.24.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.24.down_proj.weight_scale": 
"model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.24.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.24.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.24.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.24.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.25.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.25.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.25.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.25.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.25.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.25.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.26.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.26.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.26.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.26.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.26.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.26.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.27.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.27.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.27.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.27.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.27.up_proj.weight": "model-00074-of-00092.safetensors", + 
"model.layers.73.mlp.experts.27.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.28.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.28.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.28.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.28.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.28.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.28.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.29.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.29.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.29.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.29.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.29.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.29.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.3.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.3.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.3.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.3.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.3.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.3.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.30.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.30.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.30.gate_proj.weight": 
"model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.30.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.30.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.30.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.31.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.31.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.31.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.31.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.31.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.31.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.32.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.32.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.32.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.32.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.32.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.32.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.33.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.33.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.33.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.33.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.33.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.33.up_proj.weight_scale": "model-00074-of-00092.safetensors", + 
"model.layers.73.mlp.experts.34.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.34.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.34.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.34.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.34.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.34.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.35.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.35.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.35.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.35.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.35.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.35.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.36.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.36.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.36.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.36.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.36.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.36.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.37.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.37.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.37.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.37.gate_proj.weight_scale": 
"model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.37.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.37.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.38.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.38.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.38.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.38.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.38.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.38.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.39.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.39.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.39.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.39.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.39.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.39.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.4.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.4.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.4.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.4.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.4.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.4.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.40.down_proj.weight": "model-00074-of-00092.safetensors", + 
"model.layers.73.mlp.experts.40.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.40.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.40.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.40.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.40.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.41.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.41.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.41.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.41.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.41.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.41.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.42.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.42.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.42.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.42.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.42.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.42.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.43.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.43.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.43.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.43.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.43.up_proj.weight": 
"model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.43.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.44.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.44.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.44.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.44.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.44.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.44.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.45.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.45.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.45.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.45.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.45.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.45.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.46.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.46.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.46.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.46.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.46.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.46.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.47.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.47.down_proj.weight_scale": "model-00074-of-00092.safetensors", + 
"model.layers.73.mlp.experts.47.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.47.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.47.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.47.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.48.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.48.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.48.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.48.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.48.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.48.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.49.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.49.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.49.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.49.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.49.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.49.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.5.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.5.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.5.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.5.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.5.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.5.up_proj.weight_scale": "model-00074-of-00092.safetensors", 
+ "model.layers.73.mlp.experts.50.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.50.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.50.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.50.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.50.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.50.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.51.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.51.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.51.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.51.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.51.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.51.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.52.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.52.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.52.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.52.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.52.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.52.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.53.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.53.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.53.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.53.gate_proj.weight_scale": 
"model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.53.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.53.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.54.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.54.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.54.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.54.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.54.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.54.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.55.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.55.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.55.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.55.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.55.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.55.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.56.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.56.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.56.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.56.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.56.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.56.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.57.down_proj.weight": "model-00074-of-00092.safetensors", + 
"model.layers.73.mlp.experts.57.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.57.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.57.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.57.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.57.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.58.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.58.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.58.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.58.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.58.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.58.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.59.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.59.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.59.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.59.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.59.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.59.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.6.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.6.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.6.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.6.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.6.up_proj.weight": 
"model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.6.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.60.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.60.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.60.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.60.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.60.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.60.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.61.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.61.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.61.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.61.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.61.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.61.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.62.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.62.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.62.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.62.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.62.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.62.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.63.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.63.down_proj.weight_scale": "model-00074-of-00092.safetensors", + 
"model.layers.73.mlp.experts.63.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.63.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.63.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.63.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.64.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.64.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.64.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.64.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.64.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.64.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.65.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.65.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.65.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.65.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.65.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.65.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.66.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.66.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.66.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.66.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.66.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.66.up_proj.weight_scale": 
"model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.67.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.67.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.67.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.67.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.67.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.67.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.68.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.68.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.68.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.68.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.68.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.68.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.69.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.69.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.69.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.69.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.69.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.69.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.7.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.7.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.7.gate_proj.weight": "model-00074-of-00092.safetensors", + 
"model.layers.73.mlp.experts.7.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.7.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.7.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.70.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.70.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.70.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.70.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.70.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.70.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.71.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.71.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.71.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.71.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.71.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.71.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.72.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.72.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.72.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.72.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.72.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.72.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.73.down_proj.weight": 
"model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.73.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.73.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.73.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.73.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.73.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.74.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.74.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.74.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.74.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.74.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.74.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.75.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.75.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.75.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.75.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.75.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.75.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.76.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.76.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.76.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.76.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + 
"model.layers.73.mlp.experts.76.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.76.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.77.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.77.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.77.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.77.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.77.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.77.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.78.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.78.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.78.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.78.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.78.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.78.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.79.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.79.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.79.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.79.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.79.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.79.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.8.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.8.down_proj.weight_scale": 
"model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.8.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.8.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.8.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.8.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.80.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.80.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.80.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.80.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.80.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.80.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.81.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.81.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.81.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.81.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.81.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.81.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.82.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.82.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.82.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.82.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.82.up_proj.weight": "model-00074-of-00092.safetensors", + 
"model.layers.73.mlp.experts.82.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.83.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.83.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.83.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.83.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.83.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.83.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.84.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.84.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.84.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.84.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.84.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.84.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.85.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.85.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.85.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.85.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.85.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.85.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.86.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.86.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.86.gate_proj.weight": 
"model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.86.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.86.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.86.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.87.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.87.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.87.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.87.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.87.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.87.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.88.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.88.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.88.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.88.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.88.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.88.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.89.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.89.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.89.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.89.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.89.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.89.up_proj.weight_scale": "model-00074-of-00092.safetensors", + 
"model.layers.73.mlp.experts.9.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.9.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.9.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.9.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.9.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.9.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.90.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.90.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.90.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.90.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.90.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.90.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.91.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.91.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.91.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.91.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.91.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.91.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.92.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.92.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.92.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.92.gate_proj.weight_scale": 
"model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.92.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.92.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.93.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.93.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.93.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.93.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.93.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.93.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.94.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.94.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.94.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.94.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.94.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.94.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.95.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.95.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.95.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.95.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.95.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.95.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.96.down_proj.weight": "model-00074-of-00092.safetensors", + 
"model.layers.73.mlp.experts.96.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.96.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.96.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.96.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.96.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.97.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.97.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.97.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.97.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.97.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.97.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.98.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.98.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.98.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.98.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.98.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.98.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.99.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.99.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.99.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.99.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.99.up_proj.weight": 
"model-00074-of-00092.safetensors", + "model.layers.73.mlp.experts.99.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.gate.e_score_correction_bias": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.gate.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.shared_experts.down_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.shared_experts.down_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.shared_experts.gate_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.shared_experts.gate_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.shared_experts.up_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.mlp.shared_experts.up_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.post_attention_layernorm.weight": "model-00074-of-00092.safetensors", + "model.layers.73.self_attn.k_norm.weight": "model-00074-of-00092.safetensors", + "model.layers.73.self_attn.k_proj.bias": "model-00074-of-00092.safetensors", + "model.layers.73.self_attn.k_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.self_attn.k_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.self_attn.o_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.self_attn.o_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.self_attn.q_norm.weight": "model-00074-of-00092.safetensors", + "model.layers.73.self_attn.q_proj.bias": "model-00074-of-00092.safetensors", + "model.layers.73.self_attn.q_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.self_attn.q_proj.weight_scale": "model-00074-of-00092.safetensors", + "model.layers.73.self_attn.v_proj.bias": "model-00074-of-00092.safetensors", + "model.layers.73.self_attn.v_proj.weight": "model-00074-of-00092.safetensors", + "model.layers.73.self_attn.v_proj.weight_scale": 
"model-00074-of-00092.safetensors", + "model.layers.74.input_layernorm.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.0.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.0.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.0.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.0.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.0.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.0.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.1.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.1.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.1.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.1.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.1.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.1.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.10.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.10.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.10.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.10.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.10.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.10.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.100.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.100.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.100.gate_proj.weight": 
"model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.100.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.100.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.100.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.101.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.101.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.101.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.101.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.101.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.101.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.102.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.102.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.102.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.102.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.102.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.102.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.103.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.103.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.103.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.103.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.103.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.103.up_proj.weight_scale": "model-00075-of-00092.safetensors", + 
"model.layers.74.mlp.experts.104.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.104.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.104.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.104.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.104.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.104.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.105.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.105.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.105.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.105.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.105.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.105.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.106.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.106.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.106.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.106.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.106.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.106.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.107.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.107.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.107.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.107.gate_proj.weight_scale": 
"model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.107.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.107.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.108.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.108.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.108.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.108.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.108.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.108.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.109.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.109.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.109.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.109.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.109.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.109.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.11.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.11.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.11.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.11.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.11.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.11.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.110.down_proj.weight": "model-00075-of-00092.safetensors", + 
"model.layers.74.mlp.experts.110.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.110.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.110.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.110.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.110.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.111.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.111.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.111.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.111.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.111.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.111.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.112.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.112.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.112.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.112.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.112.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.112.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.113.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.113.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.113.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.113.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.113.up_proj.weight": 
"model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.113.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.114.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.114.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.114.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.114.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.114.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.114.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.115.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.115.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.115.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.115.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.115.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.115.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.116.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.116.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.116.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.116.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.116.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.116.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.117.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.117.down_proj.weight_scale": "model-00075-of-00092.safetensors", + 
"model.layers.74.mlp.experts.117.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.117.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.117.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.117.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.118.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.118.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.118.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.118.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.118.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.118.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.119.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.119.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.119.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.119.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.119.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.119.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.12.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.12.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.12.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.12.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.12.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.12.up_proj.weight_scale": 
"model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.120.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.120.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.120.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.120.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.120.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.120.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.121.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.121.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.121.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.121.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.121.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.121.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.122.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.122.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.122.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.122.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.122.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.122.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.123.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.123.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.123.gate_proj.weight": "model-00075-of-00092.safetensors", + 
"model.layers.74.mlp.experts.123.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.123.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.123.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.124.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.124.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.124.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.124.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.124.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.124.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.125.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.125.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.125.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.125.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.125.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.125.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.126.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.126.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.126.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.126.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.126.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.126.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.127.down_proj.weight": 
"model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.127.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.127.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.127.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.127.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.127.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.128.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.128.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.128.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.128.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.128.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.128.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.129.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.129.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.129.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.129.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.129.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.129.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.13.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.13.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.13.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.13.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + 
"model.layers.74.mlp.experts.13.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.13.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.130.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.130.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.130.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.130.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.130.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.130.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.131.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.131.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.131.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.131.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.131.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.131.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.132.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.132.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.132.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.132.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.132.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.132.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.133.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.133.down_proj.weight_scale": 
"model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.133.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.133.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.133.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.133.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.134.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.134.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.134.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.134.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.134.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.134.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.135.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.135.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.135.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.135.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.135.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.135.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.136.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.136.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.136.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.136.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.136.up_proj.weight": "model-00075-of-00092.safetensors", + 
"model.layers.74.mlp.experts.136.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.137.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.137.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.137.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.137.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.137.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.137.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.138.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.138.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.138.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.138.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.138.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.138.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.139.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.139.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.139.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.139.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.139.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.139.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.14.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.14.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.14.gate_proj.weight": 
"model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.14.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.14.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.14.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.140.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.140.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.140.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.140.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.140.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.140.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.141.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.141.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.141.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.141.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.141.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.141.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.142.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.142.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.142.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.142.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.142.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.142.up_proj.weight_scale": "model-00075-of-00092.safetensors", + 
"model.layers.74.mlp.experts.143.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.143.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.143.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.143.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.143.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.143.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.144.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.144.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.144.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.144.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.144.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.144.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.145.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.145.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.145.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.145.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.145.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.145.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.146.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.146.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.146.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.146.gate_proj.weight_scale": 
"model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.146.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.146.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.147.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.147.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.147.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.147.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.147.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.147.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.148.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.148.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.148.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.148.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.148.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.148.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.149.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.149.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.149.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.149.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.149.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.149.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.15.down_proj.weight": "model-00075-of-00092.safetensors", + 
"model.layers.74.mlp.experts.15.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.15.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.15.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.15.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.15.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.150.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.150.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.150.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.150.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.150.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.150.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.151.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.151.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.151.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.151.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.151.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.151.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.152.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.152.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.152.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.152.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.152.up_proj.weight": 
"model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.152.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.153.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.153.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.153.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.153.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.153.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.153.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.154.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.154.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.154.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.154.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.154.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.154.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.155.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.155.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.155.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.155.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.155.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.155.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.156.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.156.down_proj.weight_scale": "model-00075-of-00092.safetensors", + 
"model.layers.74.mlp.experts.156.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.156.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.156.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.156.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.157.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.157.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.157.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.157.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.157.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.157.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.158.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.158.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.158.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.158.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.158.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.158.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.159.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.159.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.159.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.159.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.159.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.159.up_proj.weight_scale": 
"model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.16.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.16.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.16.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.16.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.16.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.16.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.17.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.17.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.17.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.17.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.17.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.17.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.18.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.18.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.18.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.18.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.18.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.18.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.19.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.19.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.19.gate_proj.weight": "model-00075-of-00092.safetensors", + 
"model.layers.74.mlp.experts.19.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.19.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.19.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.2.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.2.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.2.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.2.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.2.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.2.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.20.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.20.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.20.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.20.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.20.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.20.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.21.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.21.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.21.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.21.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.21.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.21.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.22.down_proj.weight": "model-00075-of-00092.safetensors", 
+ "model.layers.74.mlp.experts.22.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.22.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.22.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.22.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.22.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.23.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.23.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.23.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.23.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.23.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.23.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.24.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.24.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.24.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.24.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.24.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.24.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.25.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.25.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.25.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.25.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.25.up_proj.weight": 
"model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.25.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.26.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.26.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.26.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.26.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.26.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.26.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.27.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.27.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.27.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.27.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.27.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.27.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.28.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.28.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.28.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.28.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.28.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.28.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.29.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.29.down_proj.weight_scale": "model-00075-of-00092.safetensors", + 
"model.layers.74.mlp.experts.29.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.29.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.29.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.29.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.3.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.3.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.3.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.3.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.3.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.3.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.30.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.30.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.30.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.30.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.30.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.30.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.31.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.31.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.31.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.31.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.31.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.31.up_proj.weight_scale": "model-00075-of-00092.safetensors", 
+ "model.layers.74.mlp.experts.32.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.32.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.32.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.32.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.32.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.32.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.33.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.33.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.33.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.33.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.33.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.33.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.34.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.34.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.34.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.34.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.34.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.34.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.35.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.35.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.35.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.35.gate_proj.weight_scale": 
"model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.35.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.35.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.36.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.36.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.36.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.36.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.36.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.36.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.37.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.37.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.37.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.37.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.37.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.37.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.38.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.38.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.38.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.38.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.38.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.38.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.39.down_proj.weight": "model-00075-of-00092.safetensors", + 
"model.layers.74.mlp.experts.39.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.39.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.39.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.39.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.39.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.4.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.4.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.4.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.4.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.4.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.4.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.40.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.40.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.40.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.40.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.40.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.40.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.41.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.41.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.41.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.41.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.41.up_proj.weight": 
"model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.41.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.42.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.42.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.42.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.42.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.42.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.42.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.43.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.43.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.43.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.43.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.43.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.43.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.44.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.44.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.44.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.44.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.44.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.44.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.45.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.45.down_proj.weight_scale": "model-00075-of-00092.safetensors", + 
"model.layers.74.mlp.experts.45.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.45.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.45.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.45.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.46.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.46.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.46.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.46.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.46.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.46.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.47.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.47.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.47.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.47.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.47.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.47.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.48.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.48.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.48.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.48.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.48.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.48.up_proj.weight_scale": 
"model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.49.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.49.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.49.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.49.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.49.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.49.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.5.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.5.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.5.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.5.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.5.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.5.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.50.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.50.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.50.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.50.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.50.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.50.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.51.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.51.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.51.gate_proj.weight": "model-00075-of-00092.safetensors", + 
"model.layers.74.mlp.experts.51.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.51.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.51.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.52.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.52.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.52.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.52.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.52.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.52.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.53.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.53.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.53.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.53.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.53.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.53.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.54.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.54.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.54.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.54.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.54.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.54.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.55.down_proj.weight": 
"model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.55.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.55.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.55.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.55.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.55.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.56.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.56.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.56.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.56.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.56.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.56.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.57.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.57.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.57.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.57.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.57.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.57.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.58.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.58.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.58.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.58.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + 
"model.layers.74.mlp.experts.58.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.58.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.59.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.59.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.59.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.59.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.59.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.59.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.6.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.6.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.6.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.6.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.6.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.6.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.60.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.60.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.60.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.60.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.60.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.60.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.61.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.61.down_proj.weight_scale": "model-00075-of-00092.safetensors", 
+ "model.layers.74.mlp.experts.61.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.61.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.61.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.61.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.62.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.62.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.62.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.62.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.62.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.62.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.63.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.63.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.63.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.63.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.63.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.63.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.64.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.64.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.64.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.64.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.64.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.64.up_proj.weight_scale": 
"model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.65.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.65.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.65.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.65.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.65.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.65.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.66.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.66.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.66.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.66.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.66.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.66.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.67.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.67.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.67.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.67.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.67.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.67.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.68.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.68.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.68.gate_proj.weight": "model-00075-of-00092.safetensors", + 
"model.layers.74.mlp.experts.68.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.68.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.68.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.69.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.69.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.69.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.69.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.69.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.69.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.7.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.7.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.7.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.7.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.7.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.7.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.70.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.70.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.70.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.70.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.70.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.70.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.71.down_proj.weight": "model-00075-of-00092.safetensors", 
+ "model.layers.74.mlp.experts.71.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.71.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.71.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.71.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.71.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.72.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.72.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.72.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.72.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.72.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.72.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.73.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.73.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.73.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.73.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.73.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.73.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.74.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.74.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.74.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.74.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.74.up_proj.weight": 
"model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.74.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.75.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.75.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.75.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.75.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.75.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.75.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.76.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.76.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.76.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.76.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.76.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.76.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.77.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.77.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.77.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.77.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.77.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.77.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.78.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.78.down_proj.weight_scale": "model-00075-of-00092.safetensors", + 
"model.layers.74.mlp.experts.78.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.78.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.78.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.78.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.79.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.79.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.79.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.79.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.79.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.79.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.8.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.8.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.8.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.8.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.8.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.8.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.80.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.80.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.80.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.80.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.80.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.80.up_proj.weight_scale": "model-00075-of-00092.safetensors", 
+ "model.layers.74.mlp.experts.81.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.81.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.81.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.81.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.81.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.81.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.82.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.82.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.82.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.82.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.82.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.82.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.83.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.83.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.83.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.83.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.83.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.83.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.84.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.84.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.84.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.84.gate_proj.weight_scale": 
"model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.84.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.84.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.85.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.85.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.85.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.85.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.85.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.85.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.86.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.86.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.86.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.86.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.86.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.86.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.87.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.87.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.87.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.87.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.87.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.87.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.88.down_proj.weight": "model-00075-of-00092.safetensors", + 
"model.layers.74.mlp.experts.88.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.88.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.88.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.88.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.88.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.89.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.89.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.89.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.89.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.89.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.89.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.9.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.9.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.9.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.9.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.9.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.9.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.90.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.90.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.90.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.90.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.90.up_proj.weight": 
"model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.90.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.91.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.91.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.91.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.91.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.91.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.91.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.92.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.92.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.92.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.92.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.92.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.92.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.93.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.93.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.93.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.93.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.93.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.93.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.94.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.94.down_proj.weight_scale": "model-00075-of-00092.safetensors", + 
"model.layers.74.mlp.experts.94.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.94.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.94.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.94.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.95.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.95.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.95.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.95.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.95.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.95.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.96.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.96.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.96.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.96.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.96.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.96.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.97.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.97.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.97.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.97.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.97.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.97.up_proj.weight_scale": 
"model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.98.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.98.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.98.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.98.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.98.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.98.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.99.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.99.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.99.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.99.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.99.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.experts.99.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.gate.e_score_correction_bias": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.gate.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.shared_experts.down_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.shared_experts.down_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.shared_experts.gate_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.shared_experts.gate_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.shared_experts.up_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.mlp.shared_experts.up_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.post_attention_layernorm.weight": "model-00075-of-00092.safetensors", + 
"model.layers.74.self_attn.k_norm.weight": "model-00075-of-00092.safetensors", + "model.layers.74.self_attn.k_proj.bias": "model-00075-of-00092.safetensors", + "model.layers.74.self_attn.k_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.self_attn.k_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.self_attn.o_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.self_attn.o_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.self_attn.q_norm.weight": "model-00075-of-00092.safetensors", + "model.layers.74.self_attn.q_proj.bias": "model-00075-of-00092.safetensors", + "model.layers.74.self_attn.q_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.self_attn.q_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.74.self_attn.v_proj.bias": "model-00075-of-00092.safetensors", + "model.layers.74.self_attn.v_proj.weight": "model-00075-of-00092.safetensors", + "model.layers.74.self_attn.v_proj.weight_scale": "model-00075-of-00092.safetensors", + "model.layers.75.input_layernorm.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.0.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.0.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.0.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.0.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.0.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.0.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.1.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.1.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.1.gate_proj.weight": "model-00076-of-00092.safetensors", + 
"model.layers.75.mlp.experts.1.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.1.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.1.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.10.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.10.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.10.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.10.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.10.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.10.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.100.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.100.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.100.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.100.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.100.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.100.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.101.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.101.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.101.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.101.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.101.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.101.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.102.down_proj.weight": 
"model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.102.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.102.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.102.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.102.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.102.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.103.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.103.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.103.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.103.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.103.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.103.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.104.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.104.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.104.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.104.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.104.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.104.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.105.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.105.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.105.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.105.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + 
"model.layers.75.mlp.experts.105.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.105.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.106.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.106.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.106.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.106.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.106.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.106.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.107.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.107.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.107.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.107.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.107.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.107.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.108.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.108.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.108.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.108.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.108.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.108.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.109.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.109.down_proj.weight_scale": 
"model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.109.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.109.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.109.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.109.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.11.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.11.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.11.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.11.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.11.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.11.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.110.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.110.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.110.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.110.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.110.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.110.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.111.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.111.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.111.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.111.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.111.up_proj.weight": "model-00076-of-00092.safetensors", + 
"model.layers.75.mlp.experts.111.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.112.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.112.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.112.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.112.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.112.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.112.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.113.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.113.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.113.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.113.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.113.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.113.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.114.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.114.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.114.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.114.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.114.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.114.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.115.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.115.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.115.gate_proj.weight": 
"model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.115.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.115.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.115.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.116.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.116.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.116.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.116.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.116.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.116.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.117.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.117.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.117.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.117.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.117.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.117.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.118.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.118.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.118.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.118.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.118.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.118.up_proj.weight_scale": "model-00076-of-00092.safetensors", + 
"model.layers.75.mlp.experts.119.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.119.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.119.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.119.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.119.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.119.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.12.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.12.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.12.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.12.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.12.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.12.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.120.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.120.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.120.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.120.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.120.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.120.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.121.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.121.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.121.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.121.gate_proj.weight_scale": 
"model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.121.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.121.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.122.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.122.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.122.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.122.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.122.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.122.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.123.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.123.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.123.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.123.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.123.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.123.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.124.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.124.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.124.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.124.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.124.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.124.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.125.down_proj.weight": "model-00076-of-00092.safetensors", + 
"model.layers.75.mlp.experts.125.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.125.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.125.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.125.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.125.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.126.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.126.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.126.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.126.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.126.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.126.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.127.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.127.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.127.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.127.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.127.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.127.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.128.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.128.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.128.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.128.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.128.up_proj.weight": 
"model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.128.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.129.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.129.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.129.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.129.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.129.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.129.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.13.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.13.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.13.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.13.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.13.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.13.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.130.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.130.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.130.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.130.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.130.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.130.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.131.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.131.down_proj.weight_scale": "model-00076-of-00092.safetensors", + 
"model.layers.75.mlp.experts.131.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.131.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.131.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.131.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.132.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.132.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.132.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.132.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.132.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.132.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.133.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.133.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.133.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.133.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.133.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.133.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.134.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.134.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.134.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.134.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.134.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.134.up_proj.weight_scale": 
"model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.135.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.135.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.135.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.135.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.135.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.135.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.136.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.136.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.136.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.136.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.136.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.136.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.137.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.137.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.137.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.137.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.137.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.137.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.138.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.138.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.138.gate_proj.weight": "model-00076-of-00092.safetensors", + 
"model.layers.75.mlp.experts.138.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.138.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.138.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.139.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.139.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.139.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.139.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.139.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.139.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.14.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.14.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.14.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.14.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.14.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.14.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.140.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.140.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.140.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.140.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.140.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.140.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.141.down_proj.weight": 
"model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.141.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.141.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.141.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.141.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.141.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.142.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.142.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.142.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.142.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.142.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.142.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.143.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.143.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.143.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.143.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.143.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.143.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.144.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.144.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.144.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.144.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + 
"model.layers.75.mlp.experts.144.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.144.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.145.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.145.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.145.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.145.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.145.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.145.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.146.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.146.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.146.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.146.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.146.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.146.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.147.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.147.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.147.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.147.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.147.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.147.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.148.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.148.down_proj.weight_scale": 
"model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.148.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.148.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.148.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.148.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.149.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.149.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.149.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.149.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.149.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.149.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.15.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.15.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.15.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.15.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.15.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.15.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.150.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.150.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.150.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.150.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.150.up_proj.weight": "model-00076-of-00092.safetensors", + 
"model.layers.75.mlp.experts.150.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.151.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.151.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.151.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.151.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.151.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.151.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.152.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.152.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.152.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.152.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.152.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.152.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.153.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.153.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.153.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.153.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.153.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.153.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.154.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.154.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.154.gate_proj.weight": 
"model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.154.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.154.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.154.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.155.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.155.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.155.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.155.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.155.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.155.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.156.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.156.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.156.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.156.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.156.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.156.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.157.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.157.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.157.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.157.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.157.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.157.up_proj.weight_scale": "model-00076-of-00092.safetensors", + 
"model.layers.75.mlp.experts.158.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.158.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.158.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.158.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.158.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.158.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.159.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.159.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.159.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.159.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.159.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.159.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.16.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.16.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.16.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.16.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.16.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.16.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.17.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.17.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.17.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.17.gate_proj.weight_scale": 
"model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.17.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.17.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.18.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.18.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.18.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.18.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.18.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.18.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.19.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.19.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.19.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.19.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.19.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.19.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.2.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.2.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.2.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.2.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.2.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.2.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.20.down_proj.weight": "model-00076-of-00092.safetensors", + 
"model.layers.75.mlp.experts.20.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.20.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.20.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.20.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.20.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.21.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.21.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.21.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.21.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.21.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.21.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.22.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.22.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.22.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.22.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.22.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.22.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.23.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.23.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.23.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.23.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.23.up_proj.weight": 
"model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.23.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.24.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.24.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.24.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.24.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.24.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.24.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.25.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.25.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.25.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.25.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.25.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.25.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.26.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.26.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.26.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.26.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.26.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.26.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.27.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.27.down_proj.weight_scale": "model-00076-of-00092.safetensors", + 
"model.layers.75.mlp.experts.27.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.27.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.27.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.27.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.28.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.28.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.28.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.28.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.28.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.28.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.29.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.29.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.29.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.29.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.29.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.29.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.3.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.3.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.3.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.3.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.3.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.3.up_proj.weight_scale": "model-00076-of-00092.safetensors", 
+ "model.layers.75.mlp.experts.30.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.30.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.30.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.30.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.30.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.30.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.31.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.31.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.31.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.31.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.31.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.31.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.32.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.32.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.32.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.32.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.32.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.32.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.33.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.33.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.33.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.33.gate_proj.weight_scale": 
"model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.33.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.33.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.34.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.34.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.34.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.34.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.34.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.34.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.35.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.35.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.35.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.35.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.35.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.35.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.36.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.36.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.36.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.36.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.36.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.36.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.37.down_proj.weight": "model-00076-of-00092.safetensors", + 
"model.layers.75.mlp.experts.37.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.37.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.37.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.37.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.37.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.38.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.38.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.38.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.38.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.38.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.38.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.39.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.39.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.39.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.39.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.39.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.39.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.4.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.4.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.4.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.4.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.4.up_proj.weight": 
"model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.4.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.40.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.40.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.40.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.40.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.40.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.40.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.41.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.41.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.41.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.41.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.41.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.41.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.42.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.42.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.42.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.42.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.42.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.42.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.43.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.43.down_proj.weight_scale": "model-00076-of-00092.safetensors", + 
"model.layers.75.mlp.experts.43.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.43.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.43.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.43.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.44.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.44.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.44.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.44.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.44.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.44.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.45.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.45.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.45.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.45.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.45.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.45.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.46.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.46.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.46.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.46.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.46.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.46.up_proj.weight_scale": 
"model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.47.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.47.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.47.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.47.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.47.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.47.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.48.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.48.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.48.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.48.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.48.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.48.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.49.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.49.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.49.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.49.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.49.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.49.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.5.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.5.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.5.gate_proj.weight": "model-00076-of-00092.safetensors", + 
"model.layers.75.mlp.experts.5.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.5.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.5.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.50.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.50.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.50.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.50.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.50.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.50.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.51.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.51.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.51.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.51.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.51.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.51.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.52.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.52.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.52.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.52.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.52.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.52.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.53.down_proj.weight": 
"model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.53.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.53.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.53.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.53.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.53.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.54.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.54.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.54.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.54.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.54.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.54.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.55.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.55.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.55.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.55.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.55.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.55.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.56.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.56.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.56.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.56.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + 
"model.layers.75.mlp.experts.56.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.56.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.57.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.57.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.57.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.57.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.57.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.57.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.58.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.58.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.58.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.58.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.58.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.58.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.59.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.59.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.59.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.59.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.59.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.59.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.6.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.6.down_proj.weight_scale": 
"model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.6.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.6.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.6.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.6.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.60.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.60.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.60.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.60.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.60.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.60.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.61.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.61.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.61.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.61.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.61.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.61.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.62.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.62.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.62.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.62.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.62.up_proj.weight": "model-00076-of-00092.safetensors", + 
"model.layers.75.mlp.experts.62.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.63.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.63.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.63.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.63.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.63.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.63.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.64.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.64.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.64.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.64.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.64.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.64.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.65.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.65.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.65.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.65.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.65.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.65.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.66.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.66.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.66.gate_proj.weight": 
"model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.66.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.66.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.66.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.67.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.67.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.67.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.67.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.67.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.67.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.68.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.68.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.68.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.68.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.68.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.68.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.69.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.69.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.69.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.69.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.69.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.69.up_proj.weight_scale": "model-00076-of-00092.safetensors", + 
"model.layers.75.mlp.experts.7.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.7.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.7.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.7.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.7.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.7.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.70.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.70.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.70.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.70.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.70.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.70.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.71.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.71.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.71.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.71.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.71.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.71.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.72.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.72.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.72.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.72.gate_proj.weight_scale": 
"model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.72.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.72.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.73.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.73.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.73.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.73.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.73.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.73.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.74.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.74.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.74.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.74.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.74.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.74.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.75.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.75.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.75.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.75.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.75.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.75.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.76.down_proj.weight": "model-00076-of-00092.safetensors", + 
"model.layers.75.mlp.experts.76.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.76.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.76.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.76.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.76.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.77.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.77.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.77.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.77.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.77.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.77.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.78.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.78.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.78.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.78.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.78.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.78.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.79.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.79.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.79.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.79.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.79.up_proj.weight": 
"model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.79.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.8.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.8.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.8.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.8.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.8.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.8.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.80.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.80.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.80.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.80.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.80.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.80.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.81.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.81.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.81.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.81.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.81.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.81.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.82.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.82.down_proj.weight_scale": "model-00076-of-00092.safetensors", + 
"model.layers.75.mlp.experts.82.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.82.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.82.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.82.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.83.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.83.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.83.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.83.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.83.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.83.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.84.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.84.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.84.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.84.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.84.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.84.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.85.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.85.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.85.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.85.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.85.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.85.up_proj.weight_scale": 
"model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.86.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.86.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.86.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.86.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.86.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.86.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.87.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.87.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.87.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.87.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.87.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.87.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.88.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.88.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.88.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.88.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.88.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.88.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.89.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.89.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.89.gate_proj.weight": "model-00076-of-00092.safetensors", + 
"model.layers.75.mlp.experts.89.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.89.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.89.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.9.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.9.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.9.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.9.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.9.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.9.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.90.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.90.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.90.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.90.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.90.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.90.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.91.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.91.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.91.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.91.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.91.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.91.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.92.down_proj.weight": "model-00076-of-00092.safetensors", 
+ "model.layers.75.mlp.experts.92.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.92.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.92.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.92.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.92.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.93.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.93.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.93.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.93.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.93.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.93.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.94.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.94.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.94.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.94.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.94.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.94.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.95.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.95.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.95.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.95.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.95.up_proj.weight": 
"model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.95.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.96.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.96.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.96.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.96.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.96.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.96.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.97.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.97.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.97.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.97.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.97.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.97.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.98.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.98.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.98.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.98.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.98.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.98.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.99.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.99.down_proj.weight_scale": "model-00076-of-00092.safetensors", + 
"model.layers.75.mlp.experts.99.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.99.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.99.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.experts.99.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.gate.e_score_correction_bias": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.gate.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.shared_experts.down_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.shared_experts.down_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.shared_experts.gate_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.shared_experts.gate_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.shared_experts.up_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.mlp.shared_experts.up_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.post_attention_layernorm.weight": "model-00076-of-00092.safetensors", + "model.layers.75.self_attn.k_norm.weight": "model-00076-of-00092.safetensors", + "model.layers.75.self_attn.k_proj.bias": "model-00076-of-00092.safetensors", + "model.layers.75.self_attn.k_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.self_attn.k_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.self_attn.o_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.self_attn.o_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.75.self_attn.q_norm.weight": "model-00076-of-00092.safetensors", + "model.layers.75.self_attn.q_proj.bias": "model-00076-of-00092.safetensors", + "model.layers.75.self_attn.q_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.self_attn.q_proj.weight_scale": 
"model-00076-of-00092.safetensors", + "model.layers.75.self_attn.v_proj.bias": "model-00076-of-00092.safetensors", + "model.layers.75.self_attn.v_proj.weight": "model-00076-of-00092.safetensors", + "model.layers.75.self_attn.v_proj.weight_scale": "model-00076-of-00092.safetensors", + "model.layers.76.input_layernorm.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.0.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.0.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.0.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.0.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.0.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.0.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.1.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.1.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.1.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.1.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.1.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.1.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.10.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.10.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.10.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.10.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.10.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.10.up_proj.weight_scale": "model-00077-of-00092.safetensors", + 
"model.layers.76.mlp.experts.100.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.100.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.100.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.100.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.100.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.100.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.101.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.101.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.101.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.101.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.101.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.101.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.102.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.102.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.102.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.102.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.102.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.102.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.103.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.103.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.103.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.103.gate_proj.weight_scale": 
"model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.103.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.103.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.104.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.104.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.104.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.104.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.104.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.104.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.105.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.105.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.105.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.105.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.105.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.105.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.106.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.106.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.106.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.106.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.106.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.106.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.107.down_proj.weight": "model-00077-of-00092.safetensors", + 
"model.layers.76.mlp.experts.107.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.107.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.107.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.107.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.107.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.108.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.108.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.108.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.108.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.108.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.108.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.109.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.109.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.109.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.109.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.109.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.109.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.11.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.11.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.11.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.11.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.11.up_proj.weight": 
"model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.11.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.110.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.110.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.110.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.110.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.110.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.110.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.111.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.111.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.111.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.111.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.111.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.111.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.112.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.112.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.112.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.112.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.112.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.112.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.113.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.113.down_proj.weight_scale": "model-00077-of-00092.safetensors", + 
"model.layers.76.mlp.experts.113.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.113.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.113.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.113.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.114.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.114.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.114.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.114.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.114.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.114.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.115.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.115.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.115.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.115.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.115.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.115.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.116.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.116.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.116.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.116.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.116.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.116.up_proj.weight_scale": 
"model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.117.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.117.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.117.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.117.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.117.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.117.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.118.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.118.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.118.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.118.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.118.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.118.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.119.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.119.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.119.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.119.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.119.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.119.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.12.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.12.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.12.gate_proj.weight": "model-00077-of-00092.safetensors", + 
"model.layers.76.mlp.experts.12.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.12.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.12.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.120.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.120.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.120.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.120.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.120.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.120.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.121.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.121.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.121.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.121.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.121.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.121.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.122.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.122.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.122.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.122.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.122.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.122.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.123.down_proj.weight": 
"model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.123.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.123.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.123.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.123.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.123.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.124.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.124.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.124.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.124.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.124.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.124.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.125.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.125.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.125.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.125.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.125.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.125.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.126.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.126.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.126.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.126.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + 
"model.layers.76.mlp.experts.126.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.126.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.127.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.127.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.127.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.127.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.127.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.127.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.128.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.128.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.128.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.128.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.128.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.128.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.129.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.129.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.129.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.129.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.129.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.129.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.13.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.13.down_proj.weight_scale": 
"model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.13.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.13.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.13.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.13.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.130.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.130.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.130.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.130.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.130.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.130.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.131.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.131.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.131.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.131.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.131.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.131.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.132.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.132.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.132.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.132.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.132.up_proj.weight": "model-00077-of-00092.safetensors", + 
"model.layers.76.mlp.experts.132.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.133.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.133.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.133.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.133.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.133.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.133.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.134.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.134.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.134.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.134.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.134.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.134.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.135.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.135.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.135.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.135.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.135.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.135.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.136.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.136.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.136.gate_proj.weight": 
"model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.136.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.136.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.136.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.137.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.137.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.137.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.137.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.137.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.137.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.138.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.138.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.138.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.138.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.138.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.138.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.139.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.139.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.139.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.139.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.139.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.139.up_proj.weight_scale": "model-00077-of-00092.safetensors", + 
"model.layers.76.mlp.experts.14.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.14.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.14.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.14.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.14.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.14.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.140.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.140.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.140.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.140.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.140.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.140.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.141.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.141.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.141.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.141.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.141.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.141.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.142.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.142.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.142.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.142.gate_proj.weight_scale": 
"model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.142.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.142.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.143.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.143.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.143.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.143.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.143.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.143.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.144.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.144.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.144.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.144.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.144.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.144.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.145.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.145.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.145.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.145.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.145.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.145.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.146.down_proj.weight": "model-00077-of-00092.safetensors", + 
"model.layers.76.mlp.experts.146.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.146.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.146.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.146.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.146.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.147.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.147.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.147.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.147.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.147.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.147.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.148.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.148.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.148.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.148.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.148.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.148.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.149.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.149.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.149.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.149.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.149.up_proj.weight": 
"model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.149.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.15.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.15.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.15.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.15.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.15.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.15.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.150.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.150.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.150.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.150.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.150.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.150.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.151.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.151.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.151.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.151.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.151.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.151.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.152.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.152.down_proj.weight_scale": "model-00077-of-00092.safetensors", + 
"model.layers.76.mlp.experts.152.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.152.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.152.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.152.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.153.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.153.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.153.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.153.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.153.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.153.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.154.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.154.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.154.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.154.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.154.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.154.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.155.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.155.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.155.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.155.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.155.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.155.up_proj.weight_scale": 
"model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.156.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.156.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.156.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.156.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.156.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.156.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.157.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.157.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.157.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.157.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.157.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.157.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.158.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.158.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.158.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.158.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.158.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.158.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.159.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.159.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.159.gate_proj.weight": "model-00077-of-00092.safetensors", + 
"model.layers.76.mlp.experts.159.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.159.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.159.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.16.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.16.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.16.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.16.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.16.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.16.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.17.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.17.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.17.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.17.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.17.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.17.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.18.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.18.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.18.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.18.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.18.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.18.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.19.down_proj.weight": 
"model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.19.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.19.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.19.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.19.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.19.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.2.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.2.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.2.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.2.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.2.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.2.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.20.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.20.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.20.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.20.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.20.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.20.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.21.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.21.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.21.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.21.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + 
"model.layers.76.mlp.experts.21.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.21.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.22.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.22.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.22.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.22.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.22.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.22.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.23.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.23.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.23.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.23.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.23.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.23.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.24.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.24.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.24.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.24.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.24.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.24.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.25.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.25.down_proj.weight_scale": 
"model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.25.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.25.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.25.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.25.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.26.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.26.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.26.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.26.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.26.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.26.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.27.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.27.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.27.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.27.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.27.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.27.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.28.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.28.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.28.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.28.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.28.up_proj.weight": "model-00077-of-00092.safetensors", + 
"model.layers.76.mlp.experts.28.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.29.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.29.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.29.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.29.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.29.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.29.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.3.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.3.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.3.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.3.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.3.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.3.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.30.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.30.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.30.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.30.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.30.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.30.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.31.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.31.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.31.gate_proj.weight": 
"model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.31.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.31.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.31.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.32.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.32.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.32.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.32.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.32.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.32.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.33.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.33.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.33.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.33.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.33.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.33.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.34.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.34.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.34.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.34.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.34.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.34.up_proj.weight_scale": "model-00077-of-00092.safetensors", + 
"model.layers.76.mlp.experts.35.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.35.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.35.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.35.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.35.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.35.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.36.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.36.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.36.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.36.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.36.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.36.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.37.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.37.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.37.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.37.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.37.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.37.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.38.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.38.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.38.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.38.gate_proj.weight_scale": 
"model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.38.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.38.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.39.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.39.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.39.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.39.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.39.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.39.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.4.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.4.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.4.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.4.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.4.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.4.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.40.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.40.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.40.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.40.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.40.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.40.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.41.down_proj.weight": "model-00077-of-00092.safetensors", + 
"model.layers.76.mlp.experts.41.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.41.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.41.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.41.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.41.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.42.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.42.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.42.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.42.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.42.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.42.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.43.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.43.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.43.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.43.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.43.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.43.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.44.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.44.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.44.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.44.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.44.up_proj.weight": 
"model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.44.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.45.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.45.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.45.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.45.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.45.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.45.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.46.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.46.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.46.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.46.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.46.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.46.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.47.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.47.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.47.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.47.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.47.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.47.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.48.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.48.down_proj.weight_scale": "model-00077-of-00092.safetensors", + 
"model.layers.76.mlp.experts.48.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.48.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.48.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.48.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.49.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.49.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.49.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.49.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.49.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.49.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.5.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.5.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.5.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.5.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.5.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.5.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.50.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.50.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.50.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.50.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.50.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.50.up_proj.weight_scale": "model-00077-of-00092.safetensors", 
+ "model.layers.76.mlp.experts.51.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.51.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.51.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.51.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.51.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.51.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.52.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.52.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.52.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.52.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.52.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.52.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.53.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.53.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.53.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.53.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.53.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.53.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.54.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.54.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.54.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.54.gate_proj.weight_scale": 
"model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.54.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.54.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.55.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.55.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.55.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.55.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.55.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.55.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.56.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.56.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.56.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.56.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.56.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.56.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.57.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.57.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.57.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.57.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.57.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.57.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.58.down_proj.weight": "model-00077-of-00092.safetensors", + 
"model.layers.76.mlp.experts.58.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.58.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.58.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.58.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.58.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.59.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.59.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.59.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.59.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.59.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.59.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.6.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.6.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.6.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.6.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.6.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.6.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.60.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.60.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.60.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.60.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.60.up_proj.weight": 
"model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.60.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.61.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.61.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.61.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.61.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.61.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.61.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.62.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.62.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.62.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.62.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.62.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.62.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.63.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.63.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.63.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.63.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.63.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.63.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.64.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.64.down_proj.weight_scale": "model-00077-of-00092.safetensors", + 
"model.layers.76.mlp.experts.64.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.64.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.64.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.64.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.65.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.65.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.65.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.65.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.65.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.65.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.66.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.66.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.66.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.66.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.66.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.66.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.67.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.67.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.67.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.67.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.67.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.67.up_proj.weight_scale": 
"model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.68.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.68.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.68.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.68.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.68.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.68.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.69.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.69.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.69.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.69.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.69.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.69.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.7.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.7.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.7.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.7.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.7.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.7.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.70.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.70.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.70.gate_proj.weight": "model-00077-of-00092.safetensors", + 
"model.layers.76.mlp.experts.70.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.70.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.70.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.71.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.71.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.71.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.71.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.71.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.71.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.72.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.72.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.72.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.72.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.72.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.72.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.73.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.73.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.73.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.73.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.73.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.73.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.74.down_proj.weight": 
"model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.74.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.74.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.74.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.74.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.74.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.75.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.75.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.75.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.75.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.75.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.75.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.76.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.76.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.76.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.76.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.76.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.76.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.77.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.77.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.77.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.77.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + 
"model.layers.76.mlp.experts.77.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.77.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.78.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.78.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.78.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.78.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.78.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.78.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.79.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.79.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.79.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.79.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.79.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.79.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.8.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.8.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.8.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.8.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.8.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.8.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.80.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.80.down_proj.weight_scale": "model-00077-of-00092.safetensors", 
+ "model.layers.76.mlp.experts.80.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.80.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.80.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.80.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.81.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.81.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.81.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.81.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.81.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.81.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.82.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.82.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.82.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.82.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.82.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.82.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.83.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.83.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.83.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.83.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.83.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.83.up_proj.weight_scale": 
"model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.84.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.84.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.84.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.84.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.84.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.84.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.85.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.85.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.85.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.85.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.85.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.85.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.86.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.86.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.86.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.86.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.86.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.86.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.87.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.87.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.87.gate_proj.weight": "model-00077-of-00092.safetensors", + 
"model.layers.76.mlp.experts.87.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.87.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.87.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.88.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.88.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.88.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.88.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.88.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.88.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.89.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.89.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.89.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.89.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.89.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.89.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.9.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.9.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.9.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.9.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.9.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.9.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.90.down_proj.weight": "model-00077-of-00092.safetensors", 
+ "model.layers.76.mlp.experts.90.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.90.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.90.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.90.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.90.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.91.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.91.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.91.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.91.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.91.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.91.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.92.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.92.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.92.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.92.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.92.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.92.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.93.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.93.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.93.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.93.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.93.up_proj.weight": 
"model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.93.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.94.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.94.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.94.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.94.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.94.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.94.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.95.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.95.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.95.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.95.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.95.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.95.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.96.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.96.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.96.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.96.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.96.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.96.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.97.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.97.down_proj.weight_scale": "model-00077-of-00092.safetensors", + 
"model.layers.76.mlp.experts.97.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.97.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.97.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.97.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.98.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.98.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.98.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.98.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.98.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.98.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.99.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.99.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.99.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.99.gate_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.99.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.experts.99.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.gate.e_score_correction_bias": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.gate.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.shared_experts.down_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.shared_experts.down_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.shared_experts.gate_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.shared_experts.gate_proj.weight_scale": 
"model-00077-of-00092.safetensors", + "model.layers.76.mlp.shared_experts.up_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.mlp.shared_experts.up_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.post_attention_layernorm.weight": "model-00077-of-00092.safetensors", + "model.layers.76.self_attn.k_norm.weight": "model-00077-of-00092.safetensors", + "model.layers.76.self_attn.k_proj.bias": "model-00077-of-00092.safetensors", + "model.layers.76.self_attn.k_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.self_attn.k_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.self_attn.o_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.self_attn.o_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.self_attn.q_norm.weight": "model-00077-of-00092.safetensors", + "model.layers.76.self_attn.q_proj.bias": "model-00077-of-00092.safetensors", + "model.layers.76.self_attn.q_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.self_attn.q_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.76.self_attn.v_proj.bias": "model-00077-of-00092.safetensors", + "model.layers.76.self_attn.v_proj.weight": "model-00077-of-00092.safetensors", + "model.layers.76.self_attn.v_proj.weight_scale": "model-00077-of-00092.safetensors", + "model.layers.77.input_layernorm.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.0.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.0.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.0.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.0.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.0.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.0.up_proj.weight_scale": 
"model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.1.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.1.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.1.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.1.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.1.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.1.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.10.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.10.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.10.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.10.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.10.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.10.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.100.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.100.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.100.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.100.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.100.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.100.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.101.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.101.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.101.gate_proj.weight": "model-00078-of-00092.safetensors", + 
"model.layers.77.mlp.experts.101.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.101.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.101.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.102.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.102.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.102.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.102.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.102.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.102.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.103.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.103.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.103.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.103.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.103.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.103.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.104.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.104.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.104.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.104.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.104.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.104.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.105.down_proj.weight": 
"model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.105.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.105.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.105.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.105.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.105.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.106.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.106.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.106.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.106.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.106.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.106.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.107.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.107.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.107.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.107.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.107.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.107.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.108.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.108.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.108.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.108.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + 
"model.layers.77.mlp.experts.108.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.108.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.109.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.109.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.109.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.109.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.109.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.109.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.11.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.11.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.11.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.11.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.11.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.11.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.110.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.110.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.110.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.110.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.110.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.110.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.111.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.111.down_proj.weight_scale": 
"model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.111.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.111.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.111.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.111.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.112.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.112.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.112.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.112.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.112.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.112.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.113.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.113.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.113.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.113.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.113.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.113.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.114.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.114.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.114.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.114.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.114.up_proj.weight": "model-00078-of-00092.safetensors", + 
"model.layers.77.mlp.experts.114.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.115.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.115.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.115.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.115.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.115.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.115.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.116.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.116.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.116.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.116.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.116.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.116.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.117.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.117.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.117.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.117.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.117.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.117.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.118.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.118.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.118.gate_proj.weight": 
"model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.118.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.118.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.118.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.119.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.119.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.119.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.119.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.119.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.119.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.12.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.12.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.12.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.12.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.12.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.12.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.120.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.120.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.120.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.120.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.120.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.120.up_proj.weight_scale": "model-00078-of-00092.safetensors", + 
"model.layers.77.mlp.experts.121.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.121.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.121.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.121.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.121.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.121.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.122.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.122.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.122.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.122.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.122.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.122.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.123.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.123.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.123.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.123.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.123.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.123.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.124.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.124.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.124.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.124.gate_proj.weight_scale": 
"model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.124.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.124.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.125.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.125.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.125.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.125.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.125.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.125.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.126.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.126.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.126.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.126.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.126.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.126.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.127.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.127.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.127.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.127.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.127.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.127.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.128.down_proj.weight": "model-00078-of-00092.safetensors", + 
"model.layers.77.mlp.experts.128.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.128.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.128.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.128.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.128.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.129.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.129.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.129.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.129.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.129.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.129.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.13.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.13.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.13.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.13.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.13.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.13.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.130.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.130.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.130.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.130.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.130.up_proj.weight": 
"model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.130.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.131.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.131.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.131.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.131.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.131.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.131.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.132.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.132.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.132.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.132.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.132.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.132.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.133.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.133.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.133.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.133.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.133.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.133.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.134.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.134.down_proj.weight_scale": "model-00078-of-00092.safetensors", + 
"model.layers.77.mlp.experts.134.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.134.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.134.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.134.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.135.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.135.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.135.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.135.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.135.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.135.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.136.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.136.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.136.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.136.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.136.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.136.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.137.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.137.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.137.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.137.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.137.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.137.up_proj.weight_scale": 
"model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.138.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.138.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.138.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.138.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.138.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.138.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.139.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.139.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.139.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.139.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.139.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.139.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.14.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.14.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.14.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.14.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.14.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.14.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.140.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.140.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.140.gate_proj.weight": "model-00078-of-00092.safetensors", + 
"model.layers.77.mlp.experts.140.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.140.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.140.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.141.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.141.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.141.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.141.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.141.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.141.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.142.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.142.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.142.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.142.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.142.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.142.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.143.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.143.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.143.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.143.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.143.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.143.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.144.down_proj.weight": 
"model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.144.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.144.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.144.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.144.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.144.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.145.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.145.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.145.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.145.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.145.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.145.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.146.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.146.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.146.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.146.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.146.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.146.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.147.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.147.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.147.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.147.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + 
"model.layers.77.mlp.experts.147.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.147.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.148.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.148.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.148.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.148.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.148.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.148.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.149.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.149.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.149.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.149.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.149.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.149.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.15.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.15.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.15.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.15.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.15.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.15.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.150.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.150.down_proj.weight_scale": 
"model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.150.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.150.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.150.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.150.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.151.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.151.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.151.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.151.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.151.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.151.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.152.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.152.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.152.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.152.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.152.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.152.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.153.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.153.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.153.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.153.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.153.up_proj.weight": "model-00078-of-00092.safetensors", + 
"model.layers.77.mlp.experts.153.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.154.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.154.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.154.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.154.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.154.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.154.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.155.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.155.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.155.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.155.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.155.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.155.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.156.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.156.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.156.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.156.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.156.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.156.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.157.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.157.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.157.gate_proj.weight": 
"model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.157.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.157.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.157.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.158.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.158.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.158.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.158.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.158.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.158.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.159.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.159.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.159.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.159.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.159.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.159.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.16.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.16.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.16.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.16.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.16.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.16.up_proj.weight_scale": "model-00078-of-00092.safetensors", + 
"model.layers.77.mlp.experts.17.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.17.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.17.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.17.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.17.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.17.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.18.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.18.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.18.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.18.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.18.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.18.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.19.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.19.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.19.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.19.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.19.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.19.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.2.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.2.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.2.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.2.gate_proj.weight_scale": 
"model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.2.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.2.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.20.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.20.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.20.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.20.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.20.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.20.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.21.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.21.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.21.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.21.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.21.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.21.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.22.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.22.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.22.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.22.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.22.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.22.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.23.down_proj.weight": "model-00078-of-00092.safetensors", + 
"model.layers.77.mlp.experts.23.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.23.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.23.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.23.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.23.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.24.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.24.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.24.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.24.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.24.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.24.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.25.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.25.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.25.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.25.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.25.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.25.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.26.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.26.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.26.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.26.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.26.up_proj.weight": 
"model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.26.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.27.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.27.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.27.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.27.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.27.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.27.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.28.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.28.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.28.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.28.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.28.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.28.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.29.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.29.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.29.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.29.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.29.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.29.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.3.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.3.down_proj.weight_scale": "model-00078-of-00092.safetensors", + 
"model.layers.77.mlp.experts.3.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.3.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.3.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.3.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.30.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.30.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.30.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.30.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.30.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.30.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.31.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.31.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.31.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.31.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.31.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.31.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.32.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.32.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.32.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.32.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.32.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.32.up_proj.weight_scale": 
"model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.33.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.33.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.33.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.33.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.33.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.33.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.34.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.34.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.34.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.34.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.34.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.34.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.35.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.35.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.35.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.35.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.35.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.35.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.36.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.36.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.36.gate_proj.weight": "model-00078-of-00092.safetensors", + 
"model.layers.77.mlp.experts.36.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.36.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.36.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.37.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.37.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.37.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.37.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.37.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.37.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.38.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.38.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.38.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.38.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.38.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.38.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.39.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.39.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.39.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.39.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.39.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.39.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.4.down_proj.weight": 
"model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.4.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.4.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.4.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.4.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.4.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.40.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.40.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.40.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.40.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.40.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.40.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.41.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.41.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.41.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.41.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.41.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.41.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.42.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.42.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.42.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.42.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + 
"model.layers.77.mlp.experts.42.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.42.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.43.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.43.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.43.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.43.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.43.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.43.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.44.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.44.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.44.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.44.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.44.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.44.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.45.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.45.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.45.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.45.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.45.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.45.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.46.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.46.down_proj.weight_scale": 
"model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.46.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.46.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.46.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.46.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.47.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.47.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.47.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.47.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.47.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.47.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.48.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.48.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.48.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.48.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.48.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.48.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.49.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.49.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.49.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.49.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.49.up_proj.weight": "model-00078-of-00092.safetensors", + 
"model.layers.77.mlp.experts.49.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.5.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.5.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.5.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.5.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.5.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.5.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.50.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.50.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.50.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.50.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.50.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.50.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.51.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.51.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.51.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.51.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.51.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.51.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.52.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.52.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.52.gate_proj.weight": 
"model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.52.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.52.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.52.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.53.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.53.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.53.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.53.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.53.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.53.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.54.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.54.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.54.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.54.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.54.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.54.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.55.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.55.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.55.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.55.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.55.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.55.up_proj.weight_scale": "model-00078-of-00092.safetensors", + 
"model.layers.77.mlp.experts.56.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.56.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.56.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.56.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.56.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.56.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.57.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.57.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.57.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.57.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.57.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.57.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.58.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.58.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.58.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.58.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.58.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.58.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.59.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.59.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.59.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.59.gate_proj.weight_scale": 
"model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.59.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.59.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.6.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.6.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.6.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.6.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.6.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.6.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.60.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.60.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.60.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.60.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.60.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.60.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.61.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.61.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.61.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.61.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.61.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.61.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.62.down_proj.weight": "model-00078-of-00092.safetensors", + 
"model.layers.77.mlp.experts.62.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.62.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.62.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.62.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.62.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.63.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.63.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.63.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.63.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.63.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.63.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.64.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.64.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.64.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.64.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.64.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.64.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.65.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.65.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.65.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.65.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.65.up_proj.weight": 
"model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.65.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.66.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.66.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.66.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.66.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.66.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.66.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.67.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.67.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.67.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.67.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.67.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.67.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.68.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.68.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.68.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.68.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.68.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.68.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.69.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.69.down_proj.weight_scale": "model-00078-of-00092.safetensors", + 
"model.layers.77.mlp.experts.69.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.69.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.69.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.69.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.7.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.7.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.7.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.7.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.7.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.7.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.70.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.70.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.70.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.70.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.70.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.70.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.71.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.71.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.71.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.71.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.71.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.71.up_proj.weight_scale": "model-00078-of-00092.safetensors", 
+ "model.layers.77.mlp.experts.72.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.72.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.72.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.72.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.72.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.72.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.73.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.73.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.73.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.73.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.73.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.73.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.74.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.74.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.74.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.74.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.74.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.74.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.75.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.75.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.75.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.75.gate_proj.weight_scale": 
"model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.75.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.75.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.76.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.76.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.76.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.76.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.76.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.76.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.77.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.77.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.77.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.77.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.77.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.77.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.78.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.78.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.78.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.78.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.78.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.78.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.79.down_proj.weight": "model-00078-of-00092.safetensors", + 
"model.layers.77.mlp.experts.79.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.79.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.79.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.79.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.79.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.8.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.8.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.8.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.8.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.8.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.8.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.80.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.80.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.80.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.80.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.80.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.80.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.81.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.81.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.81.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.81.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.81.up_proj.weight": 
"model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.81.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.82.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.82.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.82.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.82.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.82.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.82.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.83.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.83.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.83.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.83.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.83.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.83.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.84.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.84.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.84.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.84.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.84.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.84.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.85.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.85.down_proj.weight_scale": "model-00078-of-00092.safetensors", + 
"model.layers.77.mlp.experts.85.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.85.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.85.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.85.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.86.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.86.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.86.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.86.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.86.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.86.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.87.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.87.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.87.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.87.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.87.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.87.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.88.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.88.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.88.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.88.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.88.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.88.up_proj.weight_scale": 
"model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.89.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.89.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.89.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.89.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.89.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.89.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.9.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.9.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.9.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.9.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.9.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.9.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.90.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.90.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.90.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.90.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.90.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.90.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.91.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.91.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.91.gate_proj.weight": "model-00078-of-00092.safetensors", + 
"model.layers.77.mlp.experts.91.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.91.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.91.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.92.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.92.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.92.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.92.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.92.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.92.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.93.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.93.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.93.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.93.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.93.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.93.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.94.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.94.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.94.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.94.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.94.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.94.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.95.down_proj.weight": 
"model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.95.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.95.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.95.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.95.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.95.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.96.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.96.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.96.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.96.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.96.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.96.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.97.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.97.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.97.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.97.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.97.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.97.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.98.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.98.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.98.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.98.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + 
"model.layers.77.mlp.experts.98.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.98.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.99.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.99.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.99.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.99.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.99.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.experts.99.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.gate.e_score_correction_bias": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.gate.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.shared_experts.down_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.shared_experts.down_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.shared_experts.gate_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.shared_experts.gate_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.shared_experts.up_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.mlp.shared_experts.up_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.post_attention_layernorm.weight": "model-00078-of-00092.safetensors", + "model.layers.77.self_attn.k_norm.weight": "model-00078-of-00092.safetensors", + "model.layers.77.self_attn.k_proj.bias": "model-00078-of-00092.safetensors", + "model.layers.77.self_attn.k_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.self_attn.k_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.self_attn.o_proj.weight": "model-00078-of-00092.safetensors", + 
"model.layers.77.self_attn.o_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.self_attn.q_norm.weight": "model-00078-of-00092.safetensors", + "model.layers.77.self_attn.q_proj.bias": "model-00078-of-00092.safetensors", + "model.layers.77.self_attn.q_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.self_attn.q_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.77.self_attn.v_proj.bias": "model-00078-of-00092.safetensors", + "model.layers.77.self_attn.v_proj.weight": "model-00078-of-00092.safetensors", + "model.layers.77.self_attn.v_proj.weight_scale": "model-00078-of-00092.safetensors", + "model.layers.78.input_layernorm.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.0.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.0.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.0.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.0.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.0.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.0.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.1.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.1.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.1.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.1.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.1.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.1.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.10.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.10.down_proj.weight_scale": 
"model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.10.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.10.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.10.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.10.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.100.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.100.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.100.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.100.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.100.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.100.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.101.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.101.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.101.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.101.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.101.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.101.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.102.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.102.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.102.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.102.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.102.up_proj.weight": "model-00079-of-00092.safetensors", + 
"model.layers.78.mlp.experts.102.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.103.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.103.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.103.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.103.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.103.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.103.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.104.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.104.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.104.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.104.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.104.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.104.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.105.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.105.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.105.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.105.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.105.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.105.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.106.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.106.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.106.gate_proj.weight": 
"model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.106.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.106.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.106.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.107.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.107.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.107.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.107.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.107.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.107.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.108.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.108.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.108.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.108.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.108.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.108.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.109.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.109.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.109.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.109.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.109.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.109.up_proj.weight_scale": "model-00079-of-00092.safetensors", + 
"model.layers.78.mlp.experts.11.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.11.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.11.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.11.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.11.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.11.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.110.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.110.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.110.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.110.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.110.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.110.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.111.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.111.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.111.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.111.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.111.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.111.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.112.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.112.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.112.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.112.gate_proj.weight_scale": 
"model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.112.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.112.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.113.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.113.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.113.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.113.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.113.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.113.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.114.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.114.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.114.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.114.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.114.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.114.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.115.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.115.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.115.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.115.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.115.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.115.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.116.down_proj.weight": "model-00079-of-00092.safetensors", + 
"model.layers.78.mlp.experts.116.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.116.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.116.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.116.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.116.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.117.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.117.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.117.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.117.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.117.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.117.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.118.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.118.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.118.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.118.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.118.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.118.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.119.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.119.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.119.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.119.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.119.up_proj.weight": 
"model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.119.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.12.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.12.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.12.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.12.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.12.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.12.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.120.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.120.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.120.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.120.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.120.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.120.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.121.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.121.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.121.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.121.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.121.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.121.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.122.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.122.down_proj.weight_scale": "model-00079-of-00092.safetensors", + 
"model.layers.78.mlp.experts.122.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.122.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.122.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.122.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.123.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.123.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.123.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.123.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.123.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.123.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.124.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.124.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.124.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.124.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.124.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.124.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.125.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.125.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.125.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.125.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.125.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.125.up_proj.weight_scale": 
"model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.126.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.126.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.126.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.126.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.126.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.126.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.127.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.127.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.127.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.127.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.127.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.127.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.128.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.128.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.128.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.128.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.128.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.128.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.129.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.129.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.129.gate_proj.weight": "model-00079-of-00092.safetensors", + 
"model.layers.78.mlp.experts.129.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.129.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.129.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.13.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.13.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.13.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.13.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.13.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.13.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.130.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.130.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.130.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.130.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.130.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.130.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.131.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.131.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.131.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.131.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.131.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.131.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.132.down_proj.weight": 
"model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.132.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.132.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.132.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.132.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.132.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.133.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.133.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.133.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.133.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.133.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.133.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.134.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.134.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.134.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.134.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.134.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.134.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.135.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.135.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.135.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.135.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + 
"model.layers.78.mlp.experts.135.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.135.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.136.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.136.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.136.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.136.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.136.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.136.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.137.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.137.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.137.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.137.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.137.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.137.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.138.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.138.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.138.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.138.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.138.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.138.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.139.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.139.down_proj.weight_scale": 
"model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.139.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.139.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.139.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.139.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.14.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.14.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.14.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.14.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.14.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.14.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.140.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.140.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.140.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.140.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.140.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.140.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.141.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.141.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.141.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.141.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.141.up_proj.weight": "model-00079-of-00092.safetensors", + 
"model.layers.78.mlp.experts.141.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.142.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.142.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.142.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.142.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.142.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.142.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.143.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.143.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.143.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.143.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.143.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.143.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.144.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.144.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.144.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.144.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.144.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.144.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.145.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.145.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.145.gate_proj.weight": 
"model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.145.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.145.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.145.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.146.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.146.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.146.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.146.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.146.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.146.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.147.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.147.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.147.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.147.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.147.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.147.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.148.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.148.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.148.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.148.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.148.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.148.up_proj.weight_scale": "model-00079-of-00092.safetensors", + 
"model.layers.78.mlp.experts.149.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.149.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.149.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.149.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.149.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.149.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.15.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.15.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.15.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.15.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.15.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.15.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.150.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.150.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.150.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.150.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.150.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.150.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.151.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.151.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.151.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.151.gate_proj.weight_scale": 
"model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.151.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.151.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.152.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.152.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.152.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.152.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.152.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.152.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.153.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.153.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.153.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.153.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.153.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.153.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.154.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.154.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.154.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.154.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.154.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.154.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.155.down_proj.weight": "model-00079-of-00092.safetensors", + 
"model.layers.78.mlp.experts.155.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.155.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.155.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.155.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.155.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.156.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.156.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.156.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.156.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.156.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.156.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.157.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.157.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.157.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.157.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.157.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.157.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.158.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.158.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.158.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.158.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.158.up_proj.weight": 
"model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.158.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.159.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.159.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.159.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.159.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.159.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.159.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.16.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.16.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.16.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.16.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.16.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.16.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.17.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.17.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.17.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.17.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.17.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.17.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.18.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.18.down_proj.weight_scale": "model-00079-of-00092.safetensors", + 
"model.layers.78.mlp.experts.18.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.18.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.18.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.18.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.19.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.19.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.19.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.19.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.19.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.19.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.2.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.2.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.2.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.2.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.2.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.2.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.20.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.20.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.20.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.20.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.20.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.20.up_proj.weight_scale": "model-00079-of-00092.safetensors", 
+ "model.layers.78.mlp.experts.21.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.21.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.21.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.21.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.21.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.21.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.22.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.22.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.22.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.22.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.22.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.22.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.23.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.23.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.23.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.23.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.23.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.23.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.24.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.24.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.24.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.24.gate_proj.weight_scale": 
"model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.24.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.24.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.25.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.25.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.25.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.25.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.25.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.25.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.26.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.26.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.26.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.26.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.26.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.26.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.27.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.27.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.27.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.27.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.27.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.27.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.28.down_proj.weight": "model-00079-of-00092.safetensors", + 
"model.layers.78.mlp.experts.28.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.28.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.28.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.28.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.28.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.29.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.29.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.29.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.29.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.29.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.29.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.3.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.3.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.3.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.3.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.3.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.3.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.30.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.30.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.30.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.30.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.30.up_proj.weight": 
"model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.30.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.31.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.31.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.31.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.31.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.31.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.31.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.32.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.32.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.32.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.32.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.32.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.32.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.33.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.33.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.33.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.33.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.33.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.33.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.34.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.34.down_proj.weight_scale": "model-00079-of-00092.safetensors", + 
"model.layers.78.mlp.experts.34.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.34.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.34.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.34.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.35.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.35.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.35.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.35.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.35.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.35.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.36.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.36.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.36.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.36.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.36.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.36.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.37.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.37.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.37.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.37.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.37.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.37.up_proj.weight_scale": 
"model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.38.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.38.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.38.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.38.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.38.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.38.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.39.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.39.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.39.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.39.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.39.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.39.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.4.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.4.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.4.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.4.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.4.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.4.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.40.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.40.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.40.gate_proj.weight": "model-00079-of-00092.safetensors", + 
"model.layers.78.mlp.experts.40.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.40.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.40.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.41.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.41.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.41.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.41.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.41.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.41.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.42.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.42.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.42.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.42.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.42.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.42.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.43.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.43.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.43.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.43.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.43.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.43.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.44.down_proj.weight": 
"model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.44.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.44.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.44.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.44.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.44.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.45.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.45.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.45.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.45.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.45.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.45.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.46.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.46.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.46.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.46.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.46.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.46.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.47.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.47.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.47.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.47.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + 
"model.layers.78.mlp.experts.47.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.47.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.48.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.48.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.48.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.48.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.48.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.48.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.49.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.49.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.49.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.49.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.49.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.49.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.5.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.5.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.5.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.5.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.5.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.5.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.50.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.50.down_proj.weight_scale": "model-00079-of-00092.safetensors", 
+ "model.layers.78.mlp.experts.50.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.50.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.50.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.50.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.51.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.51.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.51.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.51.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.51.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.51.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.52.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.52.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.52.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.52.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.52.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.52.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.53.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.53.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.53.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.53.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.53.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.53.up_proj.weight_scale": 
"model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.54.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.54.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.54.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.54.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.54.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.54.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.55.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.55.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.55.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.55.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.55.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.55.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.56.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.56.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.56.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.56.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.56.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.56.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.57.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.57.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.57.gate_proj.weight": "model-00079-of-00092.safetensors", + 
"model.layers.78.mlp.experts.57.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.57.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.57.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.58.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.58.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.58.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.58.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.58.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.58.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.59.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.59.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.59.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.59.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.59.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.59.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.6.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.6.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.6.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.6.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.6.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.6.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.60.down_proj.weight": "model-00079-of-00092.safetensors", 
+ "model.layers.78.mlp.experts.60.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.60.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.60.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.60.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.60.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.61.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.61.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.61.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.61.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.61.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.61.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.62.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.62.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.62.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.62.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.62.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.62.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.63.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.63.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.63.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.63.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.63.up_proj.weight": 
"model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.63.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.64.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.64.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.64.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.64.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.64.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.64.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.65.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.65.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.65.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.65.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.65.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.65.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.66.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.66.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.66.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.66.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.66.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.66.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.67.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.67.down_proj.weight_scale": "model-00079-of-00092.safetensors", + 
"model.layers.78.mlp.experts.67.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.67.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.67.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.67.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.68.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.68.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.68.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.68.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.68.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.68.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.69.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.69.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.69.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.69.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.69.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.69.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.7.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.7.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.7.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.7.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.7.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.7.up_proj.weight_scale": "model-00079-of-00092.safetensors", 
+ "model.layers.78.mlp.experts.70.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.70.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.70.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.70.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.70.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.70.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.71.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.71.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.71.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.71.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.71.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.71.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.72.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.72.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.72.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.72.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.72.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.72.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.73.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.73.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.73.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.73.gate_proj.weight_scale": 
"model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.73.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.73.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.74.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.74.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.74.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.74.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.74.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.74.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.75.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.75.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.75.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.75.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.75.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.75.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.76.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.76.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.76.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.76.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.76.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.76.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.77.down_proj.weight": "model-00079-of-00092.safetensors", + 
"model.layers.78.mlp.experts.77.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.77.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.77.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.77.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.77.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.78.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.78.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.78.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.78.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.78.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.78.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.79.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.79.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.79.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.79.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.79.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.79.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.8.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.8.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.8.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.8.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.8.up_proj.weight": 
"model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.8.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.80.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.80.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.80.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.80.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.80.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.80.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.81.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.81.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.81.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.81.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.81.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.81.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.82.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.82.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.82.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.82.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.82.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.82.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.83.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.83.down_proj.weight_scale": "model-00079-of-00092.safetensors", + 
"model.layers.78.mlp.experts.83.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.83.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.83.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.83.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.84.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.84.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.84.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.84.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.84.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.84.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.85.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.85.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.85.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.85.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.85.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.85.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.86.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.86.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.86.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.86.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.86.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.86.up_proj.weight_scale": 
"model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.87.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.87.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.87.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.87.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.87.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.87.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.88.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.88.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.88.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.88.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.88.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.88.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.89.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.89.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.89.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.89.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.89.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.89.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.9.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.9.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.9.gate_proj.weight": "model-00079-of-00092.safetensors", + 
"model.layers.78.mlp.experts.9.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.9.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.9.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.90.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.90.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.90.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.90.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.90.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.90.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.91.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.91.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.91.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.91.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.91.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.91.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.92.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.92.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.92.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.92.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.92.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.92.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.93.down_proj.weight": 
"model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.93.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.93.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.93.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.93.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.93.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.94.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.94.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.94.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.94.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.94.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.94.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.95.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.95.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.95.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.95.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.95.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.95.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.96.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.96.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.96.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.96.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + 
"model.layers.78.mlp.experts.96.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.96.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.97.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.97.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.97.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.97.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.97.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.97.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.98.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.98.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.98.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.98.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.98.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.98.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.99.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.99.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.99.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.99.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.99.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.experts.99.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.gate.e_score_correction_bias": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.gate.weight": "model-00079-of-00092.safetensors", + 
"model.layers.78.mlp.shared_experts.down_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.shared_experts.down_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.shared_experts.gate_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.shared_experts.gate_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.shared_experts.up_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.mlp.shared_experts.up_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.post_attention_layernorm.weight": "model-00079-of-00092.safetensors", + "model.layers.78.self_attn.k_norm.weight": "model-00079-of-00092.safetensors", + "model.layers.78.self_attn.k_proj.bias": "model-00079-of-00092.safetensors", + "model.layers.78.self_attn.k_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.self_attn.k_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.self_attn.o_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.self_attn.o_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.self_attn.q_norm.weight": "model-00079-of-00092.safetensors", + "model.layers.78.self_attn.q_proj.bias": "model-00079-of-00092.safetensors", + "model.layers.78.self_attn.q_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.self_attn.q_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.78.self_attn.v_proj.bias": "model-00079-of-00092.safetensors", + "model.layers.78.self_attn.v_proj.weight": "model-00079-of-00092.safetensors", + "model.layers.78.self_attn.v_proj.weight_scale": "model-00079-of-00092.safetensors", + "model.layers.79.input_layernorm.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.0.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.0.down_proj.weight_scale": "model-00080-of-00092.safetensors", + 
"model.layers.79.mlp.experts.0.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.0.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.0.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.0.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.1.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.1.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.1.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.1.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.1.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.1.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.10.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.10.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.10.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.10.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.10.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.10.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.100.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.100.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.100.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.100.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.100.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.100.up_proj.weight_scale": 
"model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.101.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.101.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.101.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.101.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.101.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.101.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.102.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.102.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.102.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.102.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.102.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.102.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.103.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.103.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.103.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.103.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.103.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.103.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.104.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.104.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.104.gate_proj.weight": "model-00080-of-00092.safetensors", + 
"model.layers.79.mlp.experts.104.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.104.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.104.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.105.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.105.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.105.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.105.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.105.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.105.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.106.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.106.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.106.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.106.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.106.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.106.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.107.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.107.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.107.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.107.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.107.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.107.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.108.down_proj.weight": 
"model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.108.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.108.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.108.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.108.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.108.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.109.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.109.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.109.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.109.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.109.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.109.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.11.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.11.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.11.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.11.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.11.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.11.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.110.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.110.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.110.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.110.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + 
"model.layers.79.mlp.experts.110.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.110.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.111.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.111.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.111.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.111.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.111.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.111.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.112.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.112.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.112.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.112.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.112.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.112.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.113.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.113.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.113.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.113.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.113.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.113.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.114.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.114.down_proj.weight_scale": 
"model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.114.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.114.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.114.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.114.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.115.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.115.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.115.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.115.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.115.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.115.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.116.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.116.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.116.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.116.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.116.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.116.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.117.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.117.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.117.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.117.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.117.up_proj.weight": "model-00080-of-00092.safetensors", + 
"model.layers.79.mlp.experts.117.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.118.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.118.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.118.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.118.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.118.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.118.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.119.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.119.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.119.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.119.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.119.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.119.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.12.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.12.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.12.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.12.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.12.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.12.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.120.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.120.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.120.gate_proj.weight": 
"model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.120.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.120.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.120.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.121.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.121.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.121.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.121.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.121.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.121.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.122.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.122.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.122.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.122.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.122.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.122.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.123.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.123.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.123.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.123.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.123.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.123.up_proj.weight_scale": "model-00080-of-00092.safetensors", + 
"model.layers.79.mlp.experts.124.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.124.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.124.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.124.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.124.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.124.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.125.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.125.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.125.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.125.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.125.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.125.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.126.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.126.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.126.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.126.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.126.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.126.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.127.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.127.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.127.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.127.gate_proj.weight_scale": 
"model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.127.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.127.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.128.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.128.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.128.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.128.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.128.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.128.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.129.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.129.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.129.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.129.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.129.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.129.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.13.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.13.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.13.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.13.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.13.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.13.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.130.down_proj.weight": "model-00080-of-00092.safetensors", + 
"model.layers.79.mlp.experts.130.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.130.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.130.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.130.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.130.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.131.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.131.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.131.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.131.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.131.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.131.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.132.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.132.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.132.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.132.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.132.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.132.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.133.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.133.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.133.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.133.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.133.up_proj.weight": 
"model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.133.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.134.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.134.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.134.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.134.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.134.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.134.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.135.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.135.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.135.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.135.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.135.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.135.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.136.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.136.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.136.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.136.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.136.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.136.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.137.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.137.down_proj.weight_scale": "model-00080-of-00092.safetensors", + 
"model.layers.79.mlp.experts.137.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.137.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.137.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.137.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.138.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.138.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.138.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.138.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.138.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.138.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.139.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.139.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.139.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.139.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.139.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.139.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.14.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.14.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.14.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.14.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.14.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.14.up_proj.weight_scale": 
"model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.140.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.140.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.140.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.140.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.140.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.140.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.141.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.141.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.141.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.141.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.141.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.141.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.142.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.142.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.142.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.142.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.142.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.142.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.143.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.143.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.143.gate_proj.weight": "model-00080-of-00092.safetensors", + 
"model.layers.79.mlp.experts.143.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.143.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.143.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.144.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.144.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.144.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.144.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.144.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.144.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.145.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.145.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.145.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.145.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.145.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.145.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.146.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.146.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.146.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.146.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.146.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.146.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.147.down_proj.weight": 
"model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.147.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.147.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.147.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.147.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.147.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.148.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.148.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.148.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.148.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.148.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.148.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.149.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.149.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.149.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.149.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.149.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.149.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.15.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.15.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.15.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.15.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + 
"model.layers.79.mlp.experts.15.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.15.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.150.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.150.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.150.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.150.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.150.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.150.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.151.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.151.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.151.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.151.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.151.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.151.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.152.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.152.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.152.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.152.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.152.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.152.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.153.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.153.down_proj.weight_scale": 
"model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.153.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.153.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.153.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.153.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.154.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.154.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.154.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.154.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.154.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.154.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.155.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.155.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.155.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.155.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.155.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.155.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.156.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.156.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.156.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.156.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.156.up_proj.weight": "model-00080-of-00092.safetensors", + 
"model.layers.79.mlp.experts.156.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.157.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.157.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.157.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.157.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.157.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.157.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.158.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.158.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.158.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.158.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.158.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.158.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.159.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.159.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.159.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.159.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.159.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.159.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.16.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.16.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.16.gate_proj.weight": 
"model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.16.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.16.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.16.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.17.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.17.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.17.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.17.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.17.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.17.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.18.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.18.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.18.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.18.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.18.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.18.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.19.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.19.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.19.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.19.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.19.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.19.up_proj.weight_scale": "model-00080-of-00092.safetensors", + 
"model.layers.79.mlp.experts.2.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.2.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.2.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.2.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.2.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.2.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.20.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.20.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.20.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.20.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.20.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.20.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.21.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.21.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.21.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.21.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.21.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.21.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.22.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.22.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.22.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.22.gate_proj.weight_scale": 
"model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.22.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.22.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.23.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.23.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.23.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.23.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.23.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.23.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.24.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.24.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.24.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.24.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.24.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.24.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.25.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.25.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.25.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.25.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.25.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.25.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.26.down_proj.weight": "model-00080-of-00092.safetensors", + 
"model.layers.79.mlp.experts.26.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.26.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.26.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.26.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.26.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.27.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.27.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.27.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.27.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.27.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.27.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.28.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.28.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.28.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.28.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.28.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.28.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.29.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.29.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.29.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.29.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.29.up_proj.weight": 
"model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.29.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.3.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.3.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.3.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.3.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.3.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.3.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.30.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.30.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.30.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.30.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.30.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.30.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.31.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.31.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.31.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.31.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.31.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.31.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.32.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.32.down_proj.weight_scale": "model-00080-of-00092.safetensors", + 
"model.layers.79.mlp.experts.32.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.32.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.32.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.32.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.33.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.33.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.33.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.33.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.33.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.33.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.34.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.34.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.34.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.34.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.34.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.34.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.35.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.35.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.35.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.35.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.35.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.35.up_proj.weight_scale": 
"model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.36.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.36.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.36.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.36.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.36.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.36.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.37.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.37.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.37.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.37.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.37.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.37.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.38.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.38.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.38.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.38.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.38.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.38.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.39.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.39.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.39.gate_proj.weight": "model-00080-of-00092.safetensors", + 
"model.layers.79.mlp.experts.39.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.39.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.39.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.4.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.4.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.4.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.4.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.4.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.4.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.40.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.40.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.40.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.40.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.40.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.40.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.41.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.41.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.41.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.41.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.41.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.41.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.42.down_proj.weight": "model-00080-of-00092.safetensors", 
+ "model.layers.79.mlp.experts.42.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.42.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.42.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.42.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.42.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.43.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.43.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.43.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.43.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.43.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.43.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.44.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.44.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.44.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.44.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.44.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.44.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.45.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.45.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.45.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.45.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.45.up_proj.weight": 
"model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.45.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.46.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.46.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.46.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.46.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.46.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.46.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.47.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.47.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.47.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.47.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.47.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.47.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.48.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.48.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.48.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.48.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.48.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.48.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.49.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.49.down_proj.weight_scale": "model-00080-of-00092.safetensors", + 
"model.layers.79.mlp.experts.49.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.49.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.49.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.49.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.5.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.5.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.5.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.5.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.5.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.5.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.50.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.50.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.50.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.50.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.50.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.50.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.51.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.51.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.51.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.51.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.51.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.51.up_proj.weight_scale": "model-00080-of-00092.safetensors", 
+ "model.layers.79.mlp.experts.52.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.52.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.52.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.52.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.52.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.52.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.53.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.53.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.53.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.53.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.53.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.53.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.54.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.54.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.54.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.54.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.54.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.54.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.55.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.55.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.55.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.55.gate_proj.weight_scale": 
"model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.55.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.55.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.56.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.56.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.56.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.56.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.56.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.56.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.57.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.57.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.57.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.57.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.57.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.57.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.58.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.58.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.58.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.58.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.58.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.58.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.59.down_proj.weight": "model-00080-of-00092.safetensors", + 
"model.layers.79.mlp.experts.59.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.59.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.59.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.59.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.59.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.6.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.6.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.6.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.6.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.6.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.6.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.60.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.60.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.60.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.60.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.60.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.60.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.61.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.61.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.61.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.61.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.61.up_proj.weight": 
"model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.61.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.62.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.62.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.62.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.62.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.62.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.62.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.63.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.63.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.63.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.63.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.63.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.63.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.64.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.64.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.64.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.64.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.64.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.64.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.65.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.65.down_proj.weight_scale": "model-00080-of-00092.safetensors", + 
"model.layers.79.mlp.experts.65.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.65.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.65.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.65.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.66.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.66.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.66.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.66.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.66.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.66.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.67.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.67.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.67.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.67.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.67.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.67.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.68.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.68.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.68.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.68.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.68.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.68.up_proj.weight_scale": 
"model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.69.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.69.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.69.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.69.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.69.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.69.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.7.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.7.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.7.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.7.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.7.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.7.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.70.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.70.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.70.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.70.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.70.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.70.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.71.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.71.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.71.gate_proj.weight": "model-00080-of-00092.safetensors", + 
"model.layers.79.mlp.experts.71.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.71.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.71.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.72.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.72.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.72.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.72.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.72.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.72.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.73.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.73.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.73.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.73.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.73.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.73.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.74.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.74.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.74.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.74.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.74.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.74.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.75.down_proj.weight": 
"model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.75.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.75.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.75.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.75.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.75.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.76.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.76.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.76.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.76.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.76.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.76.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.77.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.77.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.77.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.77.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.77.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.77.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.78.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.78.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.78.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.78.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + 
"model.layers.79.mlp.experts.78.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.78.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.79.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.79.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.79.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.79.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.79.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.79.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.8.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.8.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.8.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.8.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.8.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.8.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.80.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.80.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.80.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.80.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.80.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.80.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.81.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.81.down_proj.weight_scale": "model-00080-of-00092.safetensors", 
+ "model.layers.79.mlp.experts.81.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.81.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.81.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.81.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.82.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.82.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.82.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.82.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.82.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.82.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.83.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.83.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.83.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.83.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.83.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.83.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.84.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.84.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.84.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.84.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.84.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.84.up_proj.weight_scale": 
"model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.85.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.85.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.85.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.85.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.85.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.85.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.86.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.86.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.86.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.86.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.86.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.86.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.87.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.87.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.87.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.87.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.87.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.87.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.88.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.88.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.88.gate_proj.weight": "model-00080-of-00092.safetensors", + 
"model.layers.79.mlp.experts.88.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.88.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.88.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.89.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.89.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.89.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.89.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.89.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.89.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.9.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.9.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.9.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.9.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.9.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.9.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.90.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.90.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.90.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.90.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.90.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.90.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.91.down_proj.weight": "model-00080-of-00092.safetensors", 
+ "model.layers.79.mlp.experts.91.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.91.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.91.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.91.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.91.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.92.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.92.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.92.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.92.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.92.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.92.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.93.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.93.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.93.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.93.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.93.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.93.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.94.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.94.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.94.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.94.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.94.up_proj.weight": 
"model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.94.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.95.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.95.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.95.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.95.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.95.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.95.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.96.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.96.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.96.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.96.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.96.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.96.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.97.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.97.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.97.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.97.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.97.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.97.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.98.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.98.down_proj.weight_scale": "model-00080-of-00092.safetensors", + 
"model.layers.79.mlp.experts.98.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.98.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.98.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.98.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.99.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.99.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.99.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.99.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.99.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.experts.99.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.gate.e_score_correction_bias": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.gate.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.shared_experts.down_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.shared_experts.down_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.shared_experts.gate_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.shared_experts.gate_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.shared_experts.up_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.mlp.shared_experts.up_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.post_attention_layernorm.weight": "model-00080-of-00092.safetensors", + "model.layers.79.self_attn.k_norm.weight": "model-00080-of-00092.safetensors", + "model.layers.79.self_attn.k_proj.bias": "model-00080-of-00092.safetensors", + "model.layers.79.self_attn.k_proj.weight": "model-00080-of-00092.safetensors", + 
"model.layers.79.self_attn.k_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.self_attn.o_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.self_attn.o_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.self_attn.q_norm.weight": "model-00080-of-00092.safetensors", + "model.layers.79.self_attn.q_proj.bias": "model-00080-of-00092.safetensors", + "model.layers.79.self_attn.q_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.self_attn.q_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.79.self_attn.v_proj.bias": "model-00080-of-00092.safetensors", + "model.layers.79.self_attn.v_proj.weight": "model-00080-of-00092.safetensors", + "model.layers.79.self_attn.v_proj.weight_scale": "model-00080-of-00092.safetensors", + "model.layers.80.input_layernorm.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.0.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.0.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.0.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.0.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.0.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.0.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.1.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.1.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.1.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.1.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.1.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.1.up_proj.weight_scale": "model-00081-of-00092.safetensors", + 
"model.layers.80.mlp.experts.10.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.10.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.10.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.10.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.10.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.10.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.100.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.100.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.100.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.100.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.100.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.100.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.101.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.101.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.101.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.101.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.101.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.101.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.102.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.102.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.102.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.102.gate_proj.weight_scale": 
"model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.102.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.102.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.103.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.103.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.103.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.103.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.103.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.103.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.104.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.104.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.104.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.104.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.104.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.104.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.105.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.105.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.105.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.105.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.105.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.105.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.106.down_proj.weight": "model-00081-of-00092.safetensors", + 
"model.layers.80.mlp.experts.106.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.106.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.106.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.106.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.106.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.107.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.107.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.107.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.107.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.107.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.107.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.108.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.108.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.108.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.108.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.108.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.108.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.109.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.109.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.109.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.109.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.109.up_proj.weight": 
"model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.109.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.11.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.11.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.11.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.11.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.11.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.11.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.110.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.110.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.110.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.110.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.110.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.110.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.111.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.111.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.111.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.111.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.111.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.111.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.112.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.112.down_proj.weight_scale": "model-00081-of-00092.safetensors", + 
"model.layers.80.mlp.experts.112.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.112.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.112.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.112.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.113.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.113.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.113.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.113.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.113.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.113.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.114.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.114.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.114.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.114.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.114.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.114.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.115.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.115.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.115.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.115.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.115.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.115.up_proj.weight_scale": 
"model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.116.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.116.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.116.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.116.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.116.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.116.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.117.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.117.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.117.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.117.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.117.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.117.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.118.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.118.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.118.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.118.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.118.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.118.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.119.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.119.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.119.gate_proj.weight": "model-00081-of-00092.safetensors", + 
"model.layers.80.mlp.experts.119.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.119.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.119.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.12.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.12.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.12.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.12.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.12.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.12.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.120.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.120.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.120.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.120.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.120.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.120.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.121.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.121.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.121.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.121.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.121.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.121.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.122.down_proj.weight": 
"model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.122.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.122.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.122.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.122.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.122.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.123.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.123.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.123.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.123.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.123.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.123.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.124.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.124.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.124.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.124.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.124.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.124.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.125.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.125.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.125.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.125.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + 
"model.layers.80.mlp.experts.125.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.125.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.126.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.126.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.126.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.126.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.126.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.126.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.127.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.127.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.127.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.127.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.127.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.127.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.128.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.128.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.128.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.128.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.128.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.128.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.129.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.129.down_proj.weight_scale": 
"model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.129.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.129.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.129.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.129.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.13.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.13.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.13.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.13.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.13.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.13.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.130.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.130.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.130.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.130.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.130.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.130.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.131.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.131.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.131.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.131.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.131.up_proj.weight": "model-00081-of-00092.safetensors", + 
"model.layers.80.mlp.experts.131.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.132.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.132.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.132.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.132.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.132.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.132.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.133.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.133.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.133.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.133.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.133.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.133.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.134.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.134.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.134.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.134.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.134.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.134.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.135.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.135.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.135.gate_proj.weight": 
"model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.135.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.135.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.135.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.136.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.136.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.136.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.136.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.136.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.136.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.137.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.137.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.137.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.137.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.137.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.137.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.138.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.138.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.138.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.138.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.138.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.138.up_proj.weight_scale": "model-00081-of-00092.safetensors", + 
"model.layers.80.mlp.experts.139.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.139.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.139.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.139.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.139.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.139.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.14.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.14.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.14.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.14.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.14.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.14.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.140.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.140.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.140.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.140.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.140.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.140.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.141.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.141.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.141.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.141.gate_proj.weight_scale": 
"model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.141.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.141.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.142.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.142.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.142.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.142.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.142.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.142.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.143.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.143.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.143.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.143.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.143.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.143.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.144.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.144.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.144.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.144.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.144.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.144.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.145.down_proj.weight": "model-00081-of-00092.safetensors", + 
"model.layers.80.mlp.experts.145.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.145.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.145.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.145.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.145.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.146.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.146.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.146.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.146.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.146.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.146.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.147.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.147.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.147.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.147.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.147.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.147.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.148.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.148.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.148.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.148.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.148.up_proj.weight": 
"model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.148.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.149.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.149.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.149.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.149.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.149.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.149.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.15.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.15.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.15.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.15.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.15.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.15.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.150.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.150.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.150.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.150.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.150.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.150.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.151.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.151.down_proj.weight_scale": "model-00081-of-00092.safetensors", + 
"model.layers.80.mlp.experts.151.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.151.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.151.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.151.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.152.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.152.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.152.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.152.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.152.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.152.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.153.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.153.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.153.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.153.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.153.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.153.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.154.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.154.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.154.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.154.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.154.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.154.up_proj.weight_scale": 
"model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.155.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.155.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.155.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.155.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.155.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.155.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.156.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.156.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.156.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.156.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.156.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.156.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.157.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.157.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.157.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.157.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.157.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.157.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.158.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.158.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.158.gate_proj.weight": "model-00081-of-00092.safetensors", + 
"model.layers.80.mlp.experts.158.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.158.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.158.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.159.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.159.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.159.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.159.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.159.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.159.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.16.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.16.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.16.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.16.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.16.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.16.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.17.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.17.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.17.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.17.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.17.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.17.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.18.down_proj.weight": 
"model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.18.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.18.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.18.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.18.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.18.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.19.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.19.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.19.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.19.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.19.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.19.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.2.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.2.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.2.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.2.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.2.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.2.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.20.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.20.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.20.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.20.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + 
"model.layers.80.mlp.experts.20.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.20.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.21.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.21.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.21.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.21.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.21.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.21.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.22.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.22.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.22.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.22.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.22.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.22.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.23.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.23.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.23.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.23.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.23.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.23.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.24.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.24.down_proj.weight_scale": 
"model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.24.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.24.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.24.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.24.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.25.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.25.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.25.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.25.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.25.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.25.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.26.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.26.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.26.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.26.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.26.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.26.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.27.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.27.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.27.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.27.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.27.up_proj.weight": "model-00081-of-00092.safetensors", + 
"model.layers.80.mlp.experts.27.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.28.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.28.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.28.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.28.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.28.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.28.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.29.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.29.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.29.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.29.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.29.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.29.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.3.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.3.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.3.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.3.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.3.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.3.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.30.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.30.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.30.gate_proj.weight": 
"model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.30.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.30.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.30.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.31.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.31.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.31.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.31.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.31.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.31.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.32.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.32.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.32.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.32.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.32.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.32.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.33.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.33.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.33.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.33.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.33.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.33.up_proj.weight_scale": "model-00081-of-00092.safetensors", + 
"model.layers.80.mlp.experts.34.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.34.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.34.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.34.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.34.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.34.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.35.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.35.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.35.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.35.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.35.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.35.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.36.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.36.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.36.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.36.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.36.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.36.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.37.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.37.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.37.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.37.gate_proj.weight_scale": 
"model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.37.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.37.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.38.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.38.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.38.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.38.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.38.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.38.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.39.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.39.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.39.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.39.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.39.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.39.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.4.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.4.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.4.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.4.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.4.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.4.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.40.down_proj.weight": "model-00081-of-00092.safetensors", + 
"model.layers.80.mlp.experts.40.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.40.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.40.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.40.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.40.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.41.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.41.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.41.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.41.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.41.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.41.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.42.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.42.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.42.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.42.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.42.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.42.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.43.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.43.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.43.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.43.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.43.up_proj.weight": 
"model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.43.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.44.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.44.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.44.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.44.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.44.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.44.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.45.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.45.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.45.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.45.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.45.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.45.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.46.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.46.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.46.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.46.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.46.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.46.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.47.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.47.down_proj.weight_scale": "model-00081-of-00092.safetensors", + 
"model.layers.80.mlp.experts.47.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.47.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.47.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.47.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.48.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.48.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.48.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.48.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.48.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.48.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.49.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.49.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.49.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.49.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.49.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.49.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.5.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.5.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.5.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.5.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.5.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.5.up_proj.weight_scale": "model-00081-of-00092.safetensors", 
+ "model.layers.80.mlp.experts.50.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.50.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.50.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.50.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.50.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.50.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.51.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.51.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.51.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.51.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.51.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.51.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.52.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.52.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.52.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.52.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.52.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.52.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.53.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.53.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.53.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.53.gate_proj.weight_scale": 
"model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.53.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.53.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.54.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.54.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.54.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.54.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.54.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.54.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.55.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.55.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.55.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.55.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.55.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.55.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.56.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.56.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.56.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.56.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.56.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.56.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.57.down_proj.weight": "model-00081-of-00092.safetensors", + 
"model.layers.80.mlp.experts.57.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.57.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.57.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.57.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.57.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.58.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.58.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.58.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.58.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.58.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.58.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.59.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.59.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.59.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.59.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.59.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.59.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.6.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.6.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.6.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.6.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.6.up_proj.weight": 
"model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.6.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.60.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.60.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.60.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.60.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.60.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.60.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.61.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.61.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.61.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.61.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.61.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.61.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.62.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.62.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.62.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.62.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.62.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.62.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.63.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.63.down_proj.weight_scale": "model-00081-of-00092.safetensors", + 
"model.layers.80.mlp.experts.63.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.63.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.63.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.63.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.64.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.64.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.64.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.64.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.64.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.64.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.65.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.65.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.65.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.65.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.65.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.65.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.66.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.66.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.66.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.66.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.66.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.66.up_proj.weight_scale": 
"model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.67.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.67.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.67.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.67.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.67.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.67.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.68.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.68.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.68.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.68.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.68.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.68.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.69.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.69.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.69.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.69.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.69.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.69.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.7.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.7.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.7.gate_proj.weight": "model-00081-of-00092.safetensors", + 
"model.layers.80.mlp.experts.7.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.7.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.7.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.70.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.70.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.70.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.70.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.70.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.70.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.71.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.71.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.71.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.71.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.71.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.71.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.72.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.72.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.72.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.72.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.72.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.72.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.73.down_proj.weight": 
"model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.73.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.73.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.73.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.73.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.73.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.74.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.74.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.74.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.74.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.74.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.74.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.75.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.75.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.75.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.75.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.75.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.75.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.76.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.76.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.76.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.76.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + 
"model.layers.80.mlp.experts.76.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.76.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.77.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.77.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.77.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.77.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.77.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.77.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.78.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.78.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.78.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.78.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.78.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.78.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.79.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.79.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.79.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.79.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.79.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.79.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.8.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.8.down_proj.weight_scale": 
"model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.8.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.8.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.8.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.8.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.80.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.80.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.80.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.80.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.80.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.80.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.81.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.81.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.81.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.81.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.81.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.81.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.82.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.82.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.82.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.82.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.82.up_proj.weight": "model-00081-of-00092.safetensors", + 
"model.layers.80.mlp.experts.82.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.83.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.83.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.83.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.83.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.83.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.83.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.84.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.84.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.84.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.84.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.84.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.84.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.85.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.85.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.85.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.85.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.85.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.85.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.86.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.86.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.86.gate_proj.weight": 
"model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.86.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.86.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.86.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.87.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.87.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.87.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.87.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.87.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.87.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.88.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.88.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.88.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.88.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.88.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.88.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.89.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.89.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.89.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.89.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.89.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.89.up_proj.weight_scale": "model-00081-of-00092.safetensors", + 
"model.layers.80.mlp.experts.9.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.9.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.9.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.9.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.9.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.9.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.90.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.90.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.90.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.90.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.90.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.90.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.91.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.91.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.91.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.91.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.91.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.91.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.92.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.92.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.92.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.92.gate_proj.weight_scale": 
"model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.92.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.92.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.93.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.93.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.93.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.93.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.93.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.93.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.94.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.94.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.94.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.94.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.94.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.94.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.95.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.95.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.95.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.95.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.95.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.95.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.96.down_proj.weight": "model-00081-of-00092.safetensors", + 
"model.layers.80.mlp.experts.96.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.96.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.96.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.96.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.96.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.97.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.97.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.97.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.97.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.97.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.97.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.98.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.98.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.98.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.98.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.98.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.98.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.99.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.99.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.99.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.99.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.99.up_proj.weight": 
"model-00081-of-00092.safetensors", + "model.layers.80.mlp.experts.99.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.gate.e_score_correction_bias": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.gate.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.shared_experts.down_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.shared_experts.down_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.shared_experts.gate_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.shared_experts.gate_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.shared_experts.up_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.mlp.shared_experts.up_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.post_attention_layernorm.weight": "model-00081-of-00092.safetensors", + "model.layers.80.self_attn.k_norm.weight": "model-00081-of-00092.safetensors", + "model.layers.80.self_attn.k_proj.bias": "model-00081-of-00092.safetensors", + "model.layers.80.self_attn.k_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.self_attn.k_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.self_attn.o_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.self_attn.o_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.self_attn.q_norm.weight": "model-00081-of-00092.safetensors", + "model.layers.80.self_attn.q_proj.bias": "model-00081-of-00092.safetensors", + "model.layers.80.self_attn.q_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.self_attn.q_proj.weight_scale": "model-00081-of-00092.safetensors", + "model.layers.80.self_attn.v_proj.bias": "model-00081-of-00092.safetensors", + "model.layers.80.self_attn.v_proj.weight": "model-00081-of-00092.safetensors", + "model.layers.80.self_attn.v_proj.weight_scale": 
"model-00081-of-00092.safetensors", + "model.layers.81.input_layernorm.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.0.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.0.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.0.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.0.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.0.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.0.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.1.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.1.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.1.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.1.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.1.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.1.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.10.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.10.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.10.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.10.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.10.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.10.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.100.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.100.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.100.gate_proj.weight": 
"model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.100.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.100.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.100.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.101.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.101.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.101.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.101.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.101.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.101.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.102.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.102.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.102.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.102.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.102.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.102.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.103.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.103.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.103.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.103.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.103.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.103.up_proj.weight_scale": "model-00082-of-00092.safetensors", + 
"model.layers.81.mlp.experts.104.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.104.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.104.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.104.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.104.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.104.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.105.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.105.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.105.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.105.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.105.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.105.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.106.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.106.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.106.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.106.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.106.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.106.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.107.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.107.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.107.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.107.gate_proj.weight_scale": 
"model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.107.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.107.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.108.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.108.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.108.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.108.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.108.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.108.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.109.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.109.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.109.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.109.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.109.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.109.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.11.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.11.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.11.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.11.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.11.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.11.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.110.down_proj.weight": "model-00082-of-00092.safetensors", + 
"model.layers.81.mlp.experts.110.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.110.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.110.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.110.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.110.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.111.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.111.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.111.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.111.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.111.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.111.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.112.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.112.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.112.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.112.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.112.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.112.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.113.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.113.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.113.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.113.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.113.up_proj.weight": 
"model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.113.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.114.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.114.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.114.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.114.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.114.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.114.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.115.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.115.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.115.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.115.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.115.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.115.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.116.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.116.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.116.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.116.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.116.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.116.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.117.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.117.down_proj.weight_scale": "model-00082-of-00092.safetensors", + 
"model.layers.81.mlp.experts.117.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.117.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.117.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.117.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.118.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.118.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.118.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.118.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.118.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.118.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.119.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.119.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.119.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.119.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.119.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.119.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.12.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.12.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.12.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.12.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.12.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.12.up_proj.weight_scale": 
"model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.120.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.120.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.120.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.120.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.120.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.120.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.121.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.121.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.121.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.121.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.121.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.121.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.122.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.122.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.122.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.122.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.122.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.122.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.123.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.123.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.123.gate_proj.weight": "model-00082-of-00092.safetensors", + 
"model.layers.81.mlp.experts.123.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.123.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.123.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.124.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.124.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.124.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.124.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.124.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.124.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.125.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.125.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.125.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.125.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.125.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.125.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.126.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.126.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.126.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.126.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.126.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.126.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.127.down_proj.weight": 
"model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.127.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.127.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.127.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.127.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.127.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.128.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.128.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.128.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.128.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.128.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.128.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.129.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.129.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.129.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.129.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.129.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.129.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.13.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.13.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.13.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.13.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + 
"model.layers.81.mlp.experts.13.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.13.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.130.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.130.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.130.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.130.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.130.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.130.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.131.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.131.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.131.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.131.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.131.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.131.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.132.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.132.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.132.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.132.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.132.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.132.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.133.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.133.down_proj.weight_scale": 
"model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.133.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.133.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.133.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.133.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.134.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.134.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.134.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.134.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.134.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.134.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.135.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.135.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.135.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.135.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.135.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.135.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.136.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.136.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.136.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.136.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.136.up_proj.weight": "model-00082-of-00092.safetensors", + 
"model.layers.81.mlp.experts.136.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.137.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.137.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.137.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.137.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.137.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.137.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.138.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.138.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.138.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.138.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.138.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.138.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.139.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.139.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.139.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.139.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.139.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.139.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.14.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.14.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.14.gate_proj.weight": 
"model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.14.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.14.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.14.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.140.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.140.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.140.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.140.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.140.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.140.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.141.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.141.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.141.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.141.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.141.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.141.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.142.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.142.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.142.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.142.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.142.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.142.up_proj.weight_scale": "model-00082-of-00092.safetensors", + 
"model.layers.81.mlp.experts.143.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.143.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.143.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.143.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.143.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.143.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.144.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.144.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.144.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.144.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.144.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.144.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.145.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.145.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.145.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.145.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.145.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.145.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.146.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.146.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.146.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.146.gate_proj.weight_scale": 
"model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.146.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.146.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.147.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.147.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.147.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.147.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.147.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.147.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.148.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.148.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.148.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.148.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.148.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.148.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.149.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.149.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.149.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.149.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.149.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.149.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.15.down_proj.weight": "model-00082-of-00092.safetensors", + 
"model.layers.81.mlp.experts.15.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.15.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.15.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.15.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.15.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.150.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.150.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.150.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.150.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.150.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.150.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.151.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.151.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.151.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.151.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.151.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.151.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.152.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.152.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.152.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.152.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.152.up_proj.weight": 
"model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.152.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.153.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.153.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.153.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.153.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.153.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.153.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.154.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.154.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.154.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.154.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.154.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.154.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.155.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.155.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.155.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.155.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.155.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.155.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.156.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.156.down_proj.weight_scale": "model-00082-of-00092.safetensors", + 
"model.layers.81.mlp.experts.156.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.156.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.156.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.156.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.157.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.157.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.157.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.157.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.157.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.157.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.158.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.158.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.158.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.158.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.158.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.158.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.159.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.159.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.159.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.159.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.159.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.159.up_proj.weight_scale": 
"model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.16.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.16.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.16.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.16.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.16.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.16.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.17.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.17.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.17.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.17.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.17.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.17.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.18.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.18.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.18.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.18.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.18.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.18.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.19.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.19.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.19.gate_proj.weight": "model-00082-of-00092.safetensors", + 
"model.layers.81.mlp.experts.19.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.19.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.19.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.2.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.2.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.2.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.2.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.2.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.2.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.20.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.20.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.20.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.20.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.20.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.20.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.21.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.21.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.21.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.21.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.21.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.21.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.22.down_proj.weight": "model-00082-of-00092.safetensors", 
+ "model.layers.81.mlp.experts.22.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.22.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.22.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.22.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.22.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.23.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.23.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.23.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.23.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.23.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.23.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.24.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.24.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.24.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.24.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.24.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.24.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.25.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.25.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.25.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.25.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.25.up_proj.weight": 
"model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.25.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.26.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.26.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.26.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.26.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.26.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.26.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.27.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.27.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.27.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.27.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.27.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.27.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.28.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.28.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.28.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.28.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.28.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.28.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.29.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.29.down_proj.weight_scale": "model-00082-of-00092.safetensors", + 
"model.layers.81.mlp.experts.29.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.29.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.29.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.29.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.3.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.3.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.3.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.3.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.3.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.3.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.30.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.30.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.30.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.30.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.30.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.30.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.31.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.31.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.31.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.31.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.31.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.31.up_proj.weight_scale": "model-00082-of-00092.safetensors", 
+ "model.layers.81.mlp.experts.32.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.32.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.32.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.32.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.32.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.32.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.33.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.33.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.33.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.33.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.33.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.33.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.34.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.34.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.34.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.34.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.34.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.34.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.35.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.35.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.35.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.35.gate_proj.weight_scale": 
"model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.35.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.35.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.36.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.36.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.36.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.36.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.36.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.36.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.37.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.37.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.37.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.37.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.37.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.37.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.38.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.38.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.38.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.38.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.38.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.38.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.39.down_proj.weight": "model-00082-of-00092.safetensors", + 
"model.layers.81.mlp.experts.39.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.39.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.39.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.39.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.39.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.4.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.4.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.4.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.4.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.4.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.4.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.40.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.40.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.40.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.40.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.40.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.40.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.41.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.41.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.41.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.41.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.41.up_proj.weight": 
"model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.41.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.42.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.42.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.42.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.42.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.42.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.42.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.43.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.43.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.43.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.43.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.43.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.43.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.44.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.44.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.44.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.44.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.44.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.44.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.45.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.45.down_proj.weight_scale": "model-00082-of-00092.safetensors", + 
"model.layers.81.mlp.experts.45.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.45.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.45.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.45.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.46.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.46.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.46.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.46.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.46.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.46.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.47.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.47.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.47.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.47.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.47.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.47.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.48.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.48.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.48.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.48.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.48.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.48.up_proj.weight_scale": 
"model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.49.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.49.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.49.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.49.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.49.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.49.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.5.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.5.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.5.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.5.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.5.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.5.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.50.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.50.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.50.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.50.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.50.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.50.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.51.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.51.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.51.gate_proj.weight": "model-00082-of-00092.safetensors", + 
"model.layers.81.mlp.experts.51.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.51.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.51.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.52.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.52.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.52.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.52.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.52.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.52.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.53.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.53.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.53.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.53.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.53.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.53.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.54.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.54.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.54.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.54.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.54.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.54.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.55.down_proj.weight": 
"model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.55.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.55.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.55.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.55.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.55.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.56.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.56.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.56.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.56.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.56.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.56.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.57.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.57.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.57.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.57.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.57.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.57.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.58.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.58.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.58.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.58.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + 
"model.layers.81.mlp.experts.58.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.58.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.59.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.59.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.59.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.59.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.59.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.59.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.6.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.6.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.6.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.6.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.6.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.6.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.60.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.60.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.60.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.60.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.60.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.60.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.61.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.61.down_proj.weight_scale": "model-00082-of-00092.safetensors", 
+ "model.layers.81.mlp.experts.61.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.61.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.61.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.61.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.62.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.62.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.62.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.62.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.62.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.62.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.63.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.63.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.63.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.63.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.63.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.63.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.64.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.64.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.64.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.64.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.64.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.64.up_proj.weight_scale": 
"model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.65.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.65.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.65.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.65.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.65.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.65.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.66.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.66.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.66.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.66.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.66.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.66.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.67.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.67.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.67.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.67.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.67.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.67.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.68.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.68.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.68.gate_proj.weight": "model-00082-of-00092.safetensors", + 
"model.layers.81.mlp.experts.68.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.68.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.68.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.69.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.69.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.69.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.69.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.69.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.69.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.7.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.7.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.7.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.7.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.7.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.7.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.70.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.70.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.70.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.70.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.70.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.70.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.71.down_proj.weight": "model-00082-of-00092.safetensors", 
+ "model.layers.81.mlp.experts.71.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.71.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.71.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.71.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.71.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.72.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.72.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.72.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.72.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.72.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.72.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.73.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.73.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.73.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.73.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.73.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.73.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.74.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.74.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.74.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.74.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.74.up_proj.weight": 
"model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.74.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.75.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.75.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.75.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.75.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.75.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.75.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.76.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.76.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.76.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.76.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.76.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.76.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.77.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.77.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.77.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.77.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.77.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.77.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.78.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.78.down_proj.weight_scale": "model-00082-of-00092.safetensors", + 
"model.layers.81.mlp.experts.78.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.78.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.78.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.78.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.79.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.79.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.79.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.79.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.79.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.79.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.8.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.8.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.8.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.8.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.8.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.8.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.80.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.80.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.80.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.80.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.80.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.80.up_proj.weight_scale": "model-00082-of-00092.safetensors", 
+ "model.layers.81.mlp.experts.81.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.81.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.81.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.81.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.81.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.81.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.82.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.82.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.82.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.82.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.82.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.82.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.83.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.83.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.83.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.83.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.83.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.83.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.84.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.84.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.84.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.84.gate_proj.weight_scale": 
"model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.84.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.84.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.85.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.85.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.85.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.85.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.85.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.85.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.86.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.86.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.86.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.86.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.86.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.86.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.87.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.87.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.87.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.87.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.87.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.87.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.88.down_proj.weight": "model-00082-of-00092.safetensors", + 
"model.layers.81.mlp.experts.88.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.88.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.88.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.88.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.88.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.89.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.89.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.89.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.89.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.89.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.89.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.9.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.9.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.9.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.9.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.9.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.9.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.90.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.90.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.90.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.90.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.90.up_proj.weight": 
"model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.90.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.91.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.91.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.91.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.91.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.91.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.91.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.92.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.92.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.92.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.92.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.92.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.92.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.93.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.93.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.93.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.93.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.93.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.93.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.94.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.94.down_proj.weight_scale": "model-00082-of-00092.safetensors", + 
"model.layers.81.mlp.experts.94.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.94.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.94.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.94.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.95.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.95.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.95.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.95.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.95.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.95.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.96.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.96.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.96.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.96.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.96.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.96.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.97.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.97.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.97.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.97.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.97.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.97.up_proj.weight_scale": 
"model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.98.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.98.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.98.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.98.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.98.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.98.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.99.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.99.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.99.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.99.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.99.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.experts.99.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.gate.e_score_correction_bias": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.gate.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.shared_experts.down_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.shared_experts.down_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.shared_experts.gate_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.shared_experts.gate_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.shared_experts.up_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.mlp.shared_experts.up_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.post_attention_layernorm.weight": "model-00082-of-00092.safetensors", + 
"model.layers.81.self_attn.k_norm.weight": "model-00082-of-00092.safetensors", + "model.layers.81.self_attn.k_proj.bias": "model-00082-of-00092.safetensors", + "model.layers.81.self_attn.k_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.self_attn.k_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.self_attn.o_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.self_attn.o_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.self_attn.q_norm.weight": "model-00082-of-00092.safetensors", + "model.layers.81.self_attn.q_proj.bias": "model-00082-of-00092.safetensors", + "model.layers.81.self_attn.q_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.self_attn.q_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.81.self_attn.v_proj.bias": "model-00082-of-00092.safetensors", + "model.layers.81.self_attn.v_proj.weight": "model-00082-of-00092.safetensors", + "model.layers.81.self_attn.v_proj.weight_scale": "model-00082-of-00092.safetensors", + "model.layers.82.input_layernorm.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.0.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.0.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.0.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.0.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.0.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.0.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.1.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.1.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.1.gate_proj.weight": "model-00083-of-00092.safetensors", + 
"model.layers.82.mlp.experts.1.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.1.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.1.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.10.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.10.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.10.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.10.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.10.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.10.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.100.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.100.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.100.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.100.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.100.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.100.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.101.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.101.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.101.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.101.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.101.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.101.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.102.down_proj.weight": 
"model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.102.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.102.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.102.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.102.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.102.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.103.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.103.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.103.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.103.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.103.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.103.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.104.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.104.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.104.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.104.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.104.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.104.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.105.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.105.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.105.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.105.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + 
"model.layers.82.mlp.experts.105.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.105.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.106.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.106.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.106.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.106.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.106.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.106.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.107.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.107.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.107.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.107.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.107.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.107.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.108.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.108.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.108.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.108.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.108.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.108.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.109.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.109.down_proj.weight_scale": 
"model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.109.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.109.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.109.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.109.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.11.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.11.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.11.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.11.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.11.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.11.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.110.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.110.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.110.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.110.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.110.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.110.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.111.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.111.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.111.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.111.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.111.up_proj.weight": "model-00083-of-00092.safetensors", + 
"model.layers.82.mlp.experts.111.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.112.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.112.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.112.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.112.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.112.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.112.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.113.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.113.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.113.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.113.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.113.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.113.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.114.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.114.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.114.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.114.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.114.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.114.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.115.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.115.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.115.gate_proj.weight": 
"model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.115.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.115.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.115.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.116.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.116.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.116.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.116.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.116.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.116.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.117.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.117.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.117.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.117.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.117.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.117.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.118.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.118.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.118.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.118.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.118.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.118.up_proj.weight_scale": "model-00083-of-00092.safetensors", + 
"model.layers.82.mlp.experts.119.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.119.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.119.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.119.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.119.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.119.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.12.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.12.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.12.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.12.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.12.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.12.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.120.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.120.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.120.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.120.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.120.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.120.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.121.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.121.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.121.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.121.gate_proj.weight_scale": 
"model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.121.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.121.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.122.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.122.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.122.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.122.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.122.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.122.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.123.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.123.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.123.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.123.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.123.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.123.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.124.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.124.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.124.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.124.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.124.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.124.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.125.down_proj.weight": "model-00083-of-00092.safetensors", + 
"model.layers.82.mlp.experts.125.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.125.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.125.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.125.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.125.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.126.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.126.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.126.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.126.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.126.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.126.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.127.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.127.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.127.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.127.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.127.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.127.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.128.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.128.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.128.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.128.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.128.up_proj.weight": 
"model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.128.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.129.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.129.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.129.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.129.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.129.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.129.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.13.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.13.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.13.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.13.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.13.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.13.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.130.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.130.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.130.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.130.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.130.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.130.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.131.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.131.down_proj.weight_scale": "model-00083-of-00092.safetensors", + 
"model.layers.82.mlp.experts.131.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.131.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.131.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.131.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.132.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.132.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.132.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.132.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.132.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.132.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.133.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.133.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.133.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.133.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.133.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.133.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.134.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.134.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.134.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.134.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.134.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.134.up_proj.weight_scale": 
"model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.135.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.135.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.135.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.135.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.135.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.135.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.136.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.136.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.136.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.136.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.136.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.136.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.137.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.137.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.137.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.137.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.137.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.137.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.138.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.138.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.138.gate_proj.weight": "model-00083-of-00092.safetensors", + 
"model.layers.82.mlp.experts.138.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.138.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.138.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.139.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.139.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.139.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.139.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.139.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.139.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.14.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.14.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.14.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.14.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.14.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.14.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.140.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.140.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.140.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.140.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.140.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.140.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.141.down_proj.weight": 
"model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.141.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.141.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.141.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.141.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.141.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.142.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.142.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.142.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.142.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.142.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.142.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.143.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.143.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.143.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.143.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.143.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.143.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.144.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.144.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.144.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.144.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + 
"model.layers.82.mlp.experts.144.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.144.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.145.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.145.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.145.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.145.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.145.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.145.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.146.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.146.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.146.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.146.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.146.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.146.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.147.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.147.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.147.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.147.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.147.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.147.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.148.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.148.down_proj.weight_scale": 
"model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.148.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.148.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.148.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.148.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.149.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.149.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.149.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.149.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.149.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.149.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.15.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.15.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.15.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.15.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.15.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.15.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.150.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.150.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.150.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.150.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.150.up_proj.weight": "model-00083-of-00092.safetensors", + 
"model.layers.82.mlp.experts.150.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.151.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.151.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.151.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.151.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.151.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.151.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.152.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.152.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.152.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.152.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.152.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.152.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.153.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.153.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.153.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.153.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.153.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.153.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.154.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.154.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.154.gate_proj.weight": 
"model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.154.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.154.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.154.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.155.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.155.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.155.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.155.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.155.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.155.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.156.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.156.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.156.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.156.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.156.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.156.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.157.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.157.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.157.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.157.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.157.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.157.up_proj.weight_scale": "model-00083-of-00092.safetensors", + 
"model.layers.82.mlp.experts.158.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.158.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.158.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.158.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.158.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.158.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.159.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.159.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.159.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.159.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.159.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.159.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.16.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.16.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.16.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.16.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.16.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.16.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.17.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.17.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.17.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.17.gate_proj.weight_scale": 
"model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.17.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.17.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.18.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.18.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.18.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.18.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.18.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.18.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.19.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.19.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.19.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.19.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.19.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.19.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.2.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.2.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.2.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.2.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.2.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.2.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.20.down_proj.weight": "model-00083-of-00092.safetensors", + 
"model.layers.82.mlp.experts.20.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.20.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.20.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.20.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.20.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.21.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.21.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.21.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.21.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.21.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.21.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.22.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.22.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.22.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.22.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.22.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.22.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.23.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.23.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.23.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.23.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.23.up_proj.weight": 
"model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.23.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.24.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.24.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.24.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.24.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.24.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.24.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.25.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.25.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.25.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.25.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.25.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.25.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.26.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.26.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.26.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.26.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.26.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.26.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.27.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.27.down_proj.weight_scale": "model-00083-of-00092.safetensors", + 
"model.layers.82.mlp.experts.27.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.27.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.27.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.27.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.28.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.28.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.28.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.28.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.28.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.28.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.29.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.29.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.29.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.29.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.29.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.29.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.3.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.3.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.3.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.3.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.3.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.3.up_proj.weight_scale": "model-00083-of-00092.safetensors", 
+ "model.layers.82.mlp.experts.30.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.30.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.30.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.30.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.30.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.30.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.31.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.31.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.31.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.31.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.31.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.31.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.32.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.32.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.32.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.32.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.32.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.32.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.33.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.33.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.33.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.33.gate_proj.weight_scale": 
"model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.33.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.33.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.34.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.34.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.34.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.34.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.34.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.34.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.35.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.35.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.35.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.35.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.35.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.35.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.36.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.36.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.36.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.36.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.36.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.36.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.37.down_proj.weight": "model-00083-of-00092.safetensors", + 
"model.layers.82.mlp.experts.37.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.37.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.37.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.37.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.37.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.38.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.38.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.38.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.38.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.38.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.38.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.39.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.39.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.39.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.39.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.39.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.39.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.4.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.4.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.4.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.4.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.4.up_proj.weight": 
"model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.4.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.40.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.40.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.40.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.40.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.40.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.40.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.41.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.41.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.41.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.41.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.41.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.41.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.42.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.42.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.42.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.42.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.42.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.42.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.43.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.43.down_proj.weight_scale": "model-00083-of-00092.safetensors", + 
"model.layers.82.mlp.experts.43.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.43.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.43.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.43.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.44.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.44.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.44.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.44.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.44.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.44.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.45.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.45.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.45.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.45.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.45.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.45.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.46.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.46.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.46.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.46.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.46.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.46.up_proj.weight_scale": 
"model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.47.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.47.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.47.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.47.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.47.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.47.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.48.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.48.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.48.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.48.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.48.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.48.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.49.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.49.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.49.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.49.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.49.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.49.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.5.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.5.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.5.gate_proj.weight": "model-00083-of-00092.safetensors", + 
"model.layers.82.mlp.experts.5.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.5.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.5.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.50.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.50.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.50.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.50.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.50.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.50.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.51.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.51.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.51.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.51.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.51.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.51.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.52.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.52.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.52.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.52.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.52.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.52.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.53.down_proj.weight": 
"model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.53.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.53.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.53.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.53.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.53.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.54.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.54.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.54.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.54.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.54.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.54.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.55.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.55.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.55.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.55.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.55.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.55.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.56.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.56.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.56.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.56.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + 
"model.layers.82.mlp.experts.56.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.56.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.57.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.57.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.57.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.57.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.57.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.57.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.58.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.58.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.58.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.58.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.58.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.58.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.59.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.59.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.59.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.59.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.59.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.59.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.6.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.6.down_proj.weight_scale": 
"model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.6.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.6.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.6.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.6.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.60.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.60.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.60.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.60.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.60.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.60.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.61.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.61.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.61.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.61.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.61.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.61.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.62.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.62.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.62.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.62.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.62.up_proj.weight": "model-00083-of-00092.safetensors", + 
"model.layers.82.mlp.experts.62.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.63.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.63.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.63.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.63.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.63.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.63.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.64.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.64.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.64.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.64.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.64.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.64.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.65.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.65.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.65.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.65.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.65.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.65.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.66.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.66.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.66.gate_proj.weight": 
"model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.66.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.66.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.66.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.67.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.67.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.67.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.67.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.67.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.67.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.68.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.68.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.68.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.68.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.68.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.68.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.69.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.69.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.69.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.69.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.69.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.69.up_proj.weight_scale": "model-00083-of-00092.safetensors", + 
"model.layers.82.mlp.experts.7.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.7.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.7.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.7.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.7.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.7.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.70.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.70.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.70.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.70.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.70.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.70.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.71.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.71.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.71.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.71.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.71.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.71.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.72.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.72.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.72.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.72.gate_proj.weight_scale": 
"model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.72.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.72.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.73.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.73.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.73.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.73.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.73.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.73.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.74.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.74.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.74.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.74.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.74.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.74.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.75.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.75.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.75.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.75.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.75.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.75.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.76.down_proj.weight": "model-00083-of-00092.safetensors", + 
"model.layers.82.mlp.experts.76.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.76.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.76.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.76.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.76.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.77.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.77.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.77.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.77.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.77.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.77.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.78.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.78.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.78.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.78.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.78.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.78.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.79.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.79.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.79.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.79.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.79.up_proj.weight": 
"model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.79.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.8.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.8.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.8.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.8.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.8.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.8.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.80.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.80.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.80.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.80.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.80.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.80.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.81.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.81.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.81.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.81.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.81.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.81.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.82.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.82.down_proj.weight_scale": "model-00083-of-00092.safetensors", + 
"model.layers.82.mlp.experts.82.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.82.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.82.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.82.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.83.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.83.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.83.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.83.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.83.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.83.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.84.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.84.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.84.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.84.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.84.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.84.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.85.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.85.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.85.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.85.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.85.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.85.up_proj.weight_scale": 
"model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.86.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.86.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.86.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.86.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.86.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.86.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.87.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.87.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.87.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.87.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.87.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.87.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.88.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.88.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.88.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.88.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.88.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.88.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.89.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.89.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.89.gate_proj.weight": "model-00083-of-00092.safetensors", + 
"model.layers.82.mlp.experts.89.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.89.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.89.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.9.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.9.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.9.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.9.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.9.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.9.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.90.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.90.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.90.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.90.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.90.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.90.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.91.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.91.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.91.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.91.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.91.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.91.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.92.down_proj.weight": "model-00083-of-00092.safetensors", 
+ "model.layers.82.mlp.experts.92.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.92.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.92.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.92.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.92.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.93.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.93.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.93.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.93.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.93.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.93.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.94.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.94.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.94.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.94.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.94.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.94.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.95.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.95.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.95.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.95.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.95.up_proj.weight": 
"model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.95.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.96.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.96.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.96.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.96.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.96.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.96.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.97.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.97.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.97.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.97.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.97.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.97.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.98.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.98.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.98.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.98.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.98.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.98.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.99.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.99.down_proj.weight_scale": "model-00083-of-00092.safetensors", + 
"model.layers.82.mlp.experts.99.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.99.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.99.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.experts.99.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.gate.e_score_correction_bias": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.gate.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.shared_experts.down_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.shared_experts.down_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.shared_experts.gate_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.shared_experts.gate_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.shared_experts.up_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.mlp.shared_experts.up_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.post_attention_layernorm.weight": "model-00083-of-00092.safetensors", + "model.layers.82.self_attn.k_norm.weight": "model-00083-of-00092.safetensors", + "model.layers.82.self_attn.k_proj.bias": "model-00083-of-00092.safetensors", + "model.layers.82.self_attn.k_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.self_attn.k_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.self_attn.o_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.self_attn.o_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.82.self_attn.q_norm.weight": "model-00083-of-00092.safetensors", + "model.layers.82.self_attn.q_proj.bias": "model-00083-of-00092.safetensors", + "model.layers.82.self_attn.q_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.self_attn.q_proj.weight_scale": 
"model-00083-of-00092.safetensors", + "model.layers.82.self_attn.v_proj.bias": "model-00083-of-00092.safetensors", + "model.layers.82.self_attn.v_proj.weight": "model-00083-of-00092.safetensors", + "model.layers.82.self_attn.v_proj.weight_scale": "model-00083-of-00092.safetensors", + "model.layers.83.input_layernorm.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.0.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.0.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.0.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.0.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.0.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.0.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.1.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.1.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.1.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.1.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.1.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.1.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.10.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.10.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.10.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.10.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.10.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.10.up_proj.weight_scale": "model-00084-of-00092.safetensors", + 
"model.layers.83.mlp.experts.100.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.100.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.100.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.100.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.100.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.100.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.101.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.101.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.101.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.101.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.101.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.101.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.102.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.102.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.102.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.102.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.102.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.102.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.103.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.103.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.103.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.103.gate_proj.weight_scale": 
"model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.103.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.103.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.104.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.104.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.104.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.104.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.104.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.104.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.105.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.105.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.105.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.105.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.105.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.105.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.106.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.106.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.106.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.106.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.106.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.106.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.107.down_proj.weight": "model-00084-of-00092.safetensors", + 
"model.layers.83.mlp.experts.107.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.107.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.107.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.107.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.107.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.108.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.108.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.108.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.108.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.108.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.108.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.109.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.109.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.109.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.109.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.109.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.109.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.11.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.11.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.11.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.11.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.11.up_proj.weight": 
"model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.11.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.110.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.110.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.110.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.110.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.110.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.110.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.111.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.111.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.111.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.111.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.111.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.111.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.112.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.112.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.112.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.112.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.112.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.112.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.113.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.113.down_proj.weight_scale": "model-00084-of-00092.safetensors", + 
"model.layers.83.mlp.experts.113.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.113.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.113.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.113.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.114.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.114.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.114.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.114.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.114.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.114.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.115.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.115.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.115.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.115.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.115.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.115.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.116.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.116.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.116.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.116.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.116.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.116.up_proj.weight_scale": 
"model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.117.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.117.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.117.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.117.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.117.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.117.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.118.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.118.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.118.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.118.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.118.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.118.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.119.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.119.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.119.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.119.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.119.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.119.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.12.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.12.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.12.gate_proj.weight": "model-00084-of-00092.safetensors", + 
"model.layers.83.mlp.experts.12.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.12.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.12.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.120.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.120.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.120.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.120.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.120.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.120.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.121.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.121.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.121.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.121.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.121.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.121.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.122.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.122.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.122.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.122.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.122.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.122.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.123.down_proj.weight": 
"model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.123.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.123.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.123.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.123.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.123.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.124.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.124.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.124.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.124.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.124.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.124.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.125.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.125.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.125.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.125.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.125.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.125.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.126.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.126.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.126.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.126.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + 
"model.layers.83.mlp.experts.126.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.126.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.127.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.127.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.127.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.127.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.127.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.127.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.128.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.128.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.128.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.128.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.128.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.128.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.129.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.129.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.129.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.129.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.129.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.129.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.13.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.13.down_proj.weight_scale": 
"model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.13.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.13.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.13.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.13.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.130.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.130.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.130.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.130.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.130.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.130.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.131.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.131.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.131.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.131.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.131.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.131.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.132.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.132.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.132.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.132.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.132.up_proj.weight": "model-00084-of-00092.safetensors", + 
"model.layers.83.mlp.experts.132.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.133.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.133.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.133.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.133.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.133.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.133.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.134.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.134.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.134.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.134.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.134.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.134.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.135.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.135.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.135.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.135.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.135.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.135.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.136.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.136.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.136.gate_proj.weight": 
"model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.136.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.136.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.136.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.137.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.137.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.137.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.137.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.137.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.137.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.138.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.138.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.138.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.138.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.138.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.138.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.139.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.139.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.139.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.139.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.139.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.139.up_proj.weight_scale": "model-00084-of-00092.safetensors", + 
"model.layers.83.mlp.experts.14.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.14.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.14.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.14.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.14.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.14.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.140.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.140.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.140.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.140.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.140.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.140.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.141.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.141.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.141.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.141.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.141.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.141.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.142.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.142.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.142.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.142.gate_proj.weight_scale": 
"model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.142.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.142.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.143.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.143.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.143.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.143.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.143.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.143.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.144.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.144.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.144.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.144.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.144.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.144.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.145.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.145.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.145.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.145.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.145.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.145.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.146.down_proj.weight": "model-00084-of-00092.safetensors", + 
"model.layers.83.mlp.experts.146.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.146.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.146.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.146.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.146.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.147.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.147.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.147.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.147.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.147.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.147.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.148.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.148.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.148.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.148.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.148.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.148.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.149.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.149.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.149.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.149.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.149.up_proj.weight": 
"model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.149.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.15.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.15.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.15.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.15.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.15.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.15.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.150.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.150.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.150.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.150.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.150.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.150.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.151.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.151.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.151.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.151.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.151.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.151.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.152.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.152.down_proj.weight_scale": "model-00084-of-00092.safetensors", + 
"model.layers.83.mlp.experts.152.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.152.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.152.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.152.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.153.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.153.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.153.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.153.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.153.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.153.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.154.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.154.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.154.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.154.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.154.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.154.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.155.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.155.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.155.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.155.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.155.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.155.up_proj.weight_scale": 
"model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.156.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.156.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.156.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.156.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.156.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.156.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.157.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.157.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.157.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.157.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.157.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.157.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.158.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.158.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.158.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.158.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.158.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.158.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.159.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.159.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.159.gate_proj.weight": "model-00084-of-00092.safetensors", + 
"model.layers.83.mlp.experts.159.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.159.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.159.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.16.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.16.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.16.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.16.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.16.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.16.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.17.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.17.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.17.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.17.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.17.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.17.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.18.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.18.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.18.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.18.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.18.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.18.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.19.down_proj.weight": 
"model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.19.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.19.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.19.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.19.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.19.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.2.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.2.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.2.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.2.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.2.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.2.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.20.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.20.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.20.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.20.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.20.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.20.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.21.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.21.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.21.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.21.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + 
"model.layers.83.mlp.experts.21.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.21.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.22.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.22.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.22.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.22.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.22.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.22.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.23.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.23.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.23.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.23.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.23.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.23.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.24.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.24.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.24.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.24.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.24.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.24.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.25.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.25.down_proj.weight_scale": 
"model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.25.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.25.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.25.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.25.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.26.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.26.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.26.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.26.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.26.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.26.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.27.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.27.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.27.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.27.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.27.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.27.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.28.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.28.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.28.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.28.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.28.up_proj.weight": "model-00084-of-00092.safetensors", + 
"model.layers.83.mlp.experts.28.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.29.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.29.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.29.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.29.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.29.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.29.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.3.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.3.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.3.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.3.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.3.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.3.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.30.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.30.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.30.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.30.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.30.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.30.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.31.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.31.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.31.gate_proj.weight": 
"model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.31.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.31.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.31.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.32.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.32.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.32.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.32.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.32.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.32.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.33.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.33.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.33.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.33.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.33.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.33.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.34.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.34.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.34.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.34.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.34.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.34.up_proj.weight_scale": "model-00084-of-00092.safetensors", + 
"model.layers.83.mlp.experts.35.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.35.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.35.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.35.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.35.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.35.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.36.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.36.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.36.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.36.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.36.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.36.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.37.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.37.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.37.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.37.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.37.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.37.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.38.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.38.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.38.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.38.gate_proj.weight_scale": 
"model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.38.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.38.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.39.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.39.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.39.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.39.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.39.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.39.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.4.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.4.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.4.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.4.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.4.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.4.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.40.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.40.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.40.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.40.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.40.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.40.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.41.down_proj.weight": "model-00084-of-00092.safetensors", + 
"model.layers.83.mlp.experts.41.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.41.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.41.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.41.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.41.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.42.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.42.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.42.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.42.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.42.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.42.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.43.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.43.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.43.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.43.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.43.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.43.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.44.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.44.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.44.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.44.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.44.up_proj.weight": 
"model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.44.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.45.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.45.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.45.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.45.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.45.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.45.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.46.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.46.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.46.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.46.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.46.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.46.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.47.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.47.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.47.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.47.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.47.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.47.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.48.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.48.down_proj.weight_scale": "model-00084-of-00092.safetensors", + 
"model.layers.83.mlp.experts.48.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.48.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.48.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.48.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.49.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.49.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.49.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.49.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.49.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.49.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.5.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.5.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.5.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.5.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.5.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.5.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.50.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.50.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.50.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.50.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.50.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.50.up_proj.weight_scale": "model-00084-of-00092.safetensors", 
+ "model.layers.83.mlp.experts.51.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.51.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.51.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.51.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.51.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.51.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.52.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.52.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.52.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.52.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.52.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.52.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.53.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.53.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.53.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.53.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.53.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.53.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.54.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.54.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.54.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.54.gate_proj.weight_scale": 
"model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.54.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.54.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.55.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.55.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.55.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.55.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.55.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.55.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.56.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.56.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.56.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.56.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.56.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.56.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.57.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.57.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.57.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.57.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.57.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.57.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.58.down_proj.weight": "model-00084-of-00092.safetensors", + 
"model.layers.83.mlp.experts.58.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.58.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.58.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.58.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.58.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.59.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.59.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.59.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.59.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.59.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.59.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.6.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.6.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.6.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.6.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.6.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.6.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.60.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.60.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.60.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.60.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.60.up_proj.weight": 
"model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.60.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.61.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.61.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.61.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.61.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.61.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.61.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.62.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.62.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.62.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.62.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.62.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.62.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.63.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.63.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.63.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.63.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.63.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.63.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.64.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.64.down_proj.weight_scale": "model-00084-of-00092.safetensors", + 
"model.layers.83.mlp.experts.64.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.64.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.64.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.64.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.65.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.65.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.65.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.65.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.65.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.65.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.66.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.66.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.66.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.66.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.66.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.66.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.67.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.67.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.67.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.67.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.67.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.67.up_proj.weight_scale": 
"model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.68.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.68.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.68.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.68.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.68.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.68.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.69.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.69.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.69.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.69.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.69.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.69.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.7.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.7.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.7.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.7.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.7.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.7.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.70.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.70.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.70.gate_proj.weight": "model-00084-of-00092.safetensors", + 
"model.layers.83.mlp.experts.70.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.70.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.70.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.71.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.71.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.71.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.71.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.71.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.71.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.72.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.72.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.72.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.72.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.72.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.72.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.73.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.73.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.73.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.73.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.73.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.73.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.74.down_proj.weight": 
"model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.74.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.74.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.74.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.74.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.74.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.75.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.75.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.75.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.75.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.75.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.75.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.76.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.76.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.76.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.76.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.76.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.76.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.77.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.77.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.77.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.77.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + 
"model.layers.83.mlp.experts.77.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.77.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.78.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.78.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.78.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.78.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.78.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.78.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.79.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.79.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.79.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.79.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.79.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.79.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.8.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.8.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.8.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.8.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.8.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.8.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.80.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.80.down_proj.weight_scale": "model-00084-of-00092.safetensors", 
+ "model.layers.83.mlp.experts.80.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.80.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.80.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.80.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.81.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.81.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.81.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.81.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.81.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.81.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.82.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.82.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.82.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.82.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.82.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.82.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.83.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.83.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.83.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.83.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.83.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.83.up_proj.weight_scale": 
"model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.84.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.84.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.84.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.84.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.84.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.84.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.85.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.85.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.85.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.85.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.85.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.85.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.86.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.86.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.86.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.86.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.86.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.86.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.87.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.87.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.87.gate_proj.weight": "model-00084-of-00092.safetensors", + 
"model.layers.83.mlp.experts.87.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.87.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.87.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.88.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.88.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.88.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.88.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.88.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.88.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.89.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.89.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.89.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.89.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.89.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.89.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.9.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.9.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.9.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.9.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.9.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.9.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.90.down_proj.weight": "model-00084-of-00092.safetensors", 
+ "model.layers.83.mlp.experts.90.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.90.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.90.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.90.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.90.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.91.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.91.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.91.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.91.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.91.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.91.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.92.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.92.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.92.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.92.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.92.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.92.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.93.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.93.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.93.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.93.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.93.up_proj.weight": 
"model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.93.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.94.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.94.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.94.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.94.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.94.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.94.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.95.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.95.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.95.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.95.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.95.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.95.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.96.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.96.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.96.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.96.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.96.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.96.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.97.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.97.down_proj.weight_scale": "model-00084-of-00092.safetensors", + 
"model.layers.83.mlp.experts.97.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.97.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.97.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.97.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.98.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.98.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.98.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.98.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.98.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.98.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.99.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.99.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.99.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.99.gate_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.99.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.experts.99.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.gate.e_score_correction_bias": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.gate.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.shared_experts.down_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.shared_experts.down_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.shared_experts.gate_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.shared_experts.gate_proj.weight_scale": 
"model-00084-of-00092.safetensors", + "model.layers.83.mlp.shared_experts.up_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.mlp.shared_experts.up_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.post_attention_layernorm.weight": "model-00084-of-00092.safetensors", + "model.layers.83.self_attn.k_norm.weight": "model-00084-of-00092.safetensors", + "model.layers.83.self_attn.k_proj.bias": "model-00084-of-00092.safetensors", + "model.layers.83.self_attn.k_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.self_attn.k_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.self_attn.o_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.self_attn.o_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.self_attn.q_norm.weight": "model-00084-of-00092.safetensors", + "model.layers.83.self_attn.q_proj.bias": "model-00084-of-00092.safetensors", + "model.layers.83.self_attn.q_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.self_attn.q_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.83.self_attn.v_proj.bias": "model-00084-of-00092.safetensors", + "model.layers.83.self_attn.v_proj.weight": "model-00084-of-00092.safetensors", + "model.layers.83.self_attn.v_proj.weight_scale": "model-00084-of-00092.safetensors", + "model.layers.84.input_layernorm.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.0.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.0.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.0.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.0.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.0.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.0.up_proj.weight_scale": 
"model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.1.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.1.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.1.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.1.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.1.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.1.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.10.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.10.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.10.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.10.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.10.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.10.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.100.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.100.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.100.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.100.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.100.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.100.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.101.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.101.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.101.gate_proj.weight": "model-00085-of-00092.safetensors", + 
"model.layers.84.mlp.experts.101.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.101.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.101.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.102.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.102.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.102.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.102.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.102.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.102.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.103.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.103.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.103.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.103.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.103.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.103.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.104.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.104.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.104.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.104.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.104.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.104.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.105.down_proj.weight": 
"model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.105.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.105.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.105.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.105.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.105.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.106.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.106.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.106.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.106.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.106.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.106.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.107.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.107.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.107.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.107.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.107.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.107.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.108.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.108.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.108.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.108.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + 
"model.layers.84.mlp.experts.108.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.108.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.109.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.109.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.109.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.109.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.109.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.109.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.11.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.11.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.11.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.11.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.11.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.11.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.110.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.110.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.110.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.110.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.110.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.110.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.111.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.111.down_proj.weight_scale": 
"model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.111.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.111.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.111.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.111.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.112.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.112.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.112.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.112.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.112.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.112.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.113.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.113.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.113.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.113.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.113.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.113.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.114.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.114.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.114.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.114.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.114.up_proj.weight": "model-00085-of-00092.safetensors", + 
"model.layers.84.mlp.experts.114.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.115.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.115.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.115.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.115.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.115.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.115.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.116.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.116.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.116.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.116.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.116.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.116.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.117.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.117.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.117.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.117.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.117.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.117.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.118.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.118.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.118.gate_proj.weight": 
"model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.118.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.118.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.118.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.119.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.119.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.119.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.119.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.119.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.119.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.12.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.12.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.12.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.12.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.12.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.12.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.120.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.120.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.120.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.120.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.120.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.120.up_proj.weight_scale": "model-00085-of-00092.safetensors", + 
"model.layers.84.mlp.experts.121.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.121.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.121.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.121.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.121.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.121.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.122.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.122.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.122.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.122.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.122.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.122.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.123.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.123.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.123.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.123.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.123.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.123.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.124.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.124.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.124.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.124.gate_proj.weight_scale": 
"model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.124.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.124.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.125.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.125.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.125.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.125.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.125.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.125.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.126.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.126.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.126.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.126.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.126.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.126.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.127.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.127.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.127.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.127.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.127.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.127.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.128.down_proj.weight": "model-00085-of-00092.safetensors", + 
"model.layers.84.mlp.experts.128.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.128.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.128.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.128.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.128.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.129.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.129.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.129.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.129.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.129.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.129.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.13.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.13.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.13.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.13.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.13.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.13.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.130.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.130.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.130.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.130.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.130.up_proj.weight": 
"model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.130.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.131.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.131.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.131.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.131.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.131.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.131.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.132.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.132.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.132.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.132.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.132.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.132.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.133.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.133.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.133.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.133.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.133.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.133.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.134.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.134.down_proj.weight_scale": "model-00085-of-00092.safetensors", + 
"model.layers.84.mlp.experts.134.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.134.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.134.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.134.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.135.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.135.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.135.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.135.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.135.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.135.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.136.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.136.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.136.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.136.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.136.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.136.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.137.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.137.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.137.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.137.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.137.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.137.up_proj.weight_scale": 
"model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.138.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.138.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.138.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.138.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.138.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.138.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.139.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.139.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.139.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.139.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.139.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.139.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.14.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.14.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.14.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.14.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.14.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.14.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.140.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.140.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.140.gate_proj.weight": "model-00085-of-00092.safetensors", + 
"model.layers.84.mlp.experts.140.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.140.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.140.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.141.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.141.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.141.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.141.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.141.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.141.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.142.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.142.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.142.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.142.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.142.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.142.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.143.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.143.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.143.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.143.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.143.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.143.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.144.down_proj.weight": 
"model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.144.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.144.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.144.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.144.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.144.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.145.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.145.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.145.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.145.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.145.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.145.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.146.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.146.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.146.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.146.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.146.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.146.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.147.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.147.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.147.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.147.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + 
"model.layers.84.mlp.experts.147.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.147.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.148.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.148.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.148.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.148.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.148.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.148.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.149.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.149.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.149.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.149.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.149.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.149.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.15.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.15.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.15.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.15.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.15.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.15.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.150.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.150.down_proj.weight_scale": 
"model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.150.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.150.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.150.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.150.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.151.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.151.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.151.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.151.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.151.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.151.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.152.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.152.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.152.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.152.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.152.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.152.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.153.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.153.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.153.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.153.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.153.up_proj.weight": "model-00085-of-00092.safetensors", + 
"model.layers.84.mlp.experts.153.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.154.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.154.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.154.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.154.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.154.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.154.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.155.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.155.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.155.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.155.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.155.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.155.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.156.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.156.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.156.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.156.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.156.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.156.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.157.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.157.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.157.gate_proj.weight": 
"model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.157.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.157.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.157.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.158.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.158.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.158.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.158.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.158.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.158.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.159.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.159.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.159.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.159.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.159.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.159.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.16.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.16.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.16.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.16.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.16.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.16.up_proj.weight_scale": "model-00085-of-00092.safetensors", + 
"model.layers.84.mlp.experts.17.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.17.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.17.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.17.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.17.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.17.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.18.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.18.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.18.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.18.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.18.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.18.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.19.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.19.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.19.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.19.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.19.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.19.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.2.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.2.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.2.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.2.gate_proj.weight_scale": 
"model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.2.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.2.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.20.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.20.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.20.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.20.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.20.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.20.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.21.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.21.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.21.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.21.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.21.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.21.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.22.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.22.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.22.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.22.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.22.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.22.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.23.down_proj.weight": "model-00085-of-00092.safetensors", + 
"model.layers.84.mlp.experts.23.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.23.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.23.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.23.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.23.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.24.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.24.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.24.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.24.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.24.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.24.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.25.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.25.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.25.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.25.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.25.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.25.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.26.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.26.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.26.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.26.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.26.up_proj.weight": 
"model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.26.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.27.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.27.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.27.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.27.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.27.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.27.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.28.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.28.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.28.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.28.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.28.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.28.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.29.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.29.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.29.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.29.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.29.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.29.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.3.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.3.down_proj.weight_scale": "model-00085-of-00092.safetensors", + 
"model.layers.84.mlp.experts.3.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.3.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.3.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.3.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.30.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.30.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.30.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.30.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.30.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.30.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.31.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.31.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.31.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.31.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.31.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.31.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.32.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.32.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.32.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.32.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.32.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.32.up_proj.weight_scale": 
"model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.33.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.33.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.33.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.33.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.33.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.33.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.34.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.34.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.34.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.34.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.34.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.34.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.35.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.35.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.35.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.35.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.35.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.35.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.36.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.36.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.36.gate_proj.weight": "model-00085-of-00092.safetensors", + 
"model.layers.84.mlp.experts.36.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.36.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.36.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.37.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.37.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.37.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.37.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.37.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.37.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.38.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.38.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.38.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.38.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.38.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.38.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.39.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.39.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.39.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.39.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.39.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.39.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.4.down_proj.weight": 
"model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.4.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.4.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.4.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.4.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.4.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.40.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.40.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.40.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.40.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.40.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.40.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.41.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.41.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.41.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.41.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.41.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.41.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.42.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.42.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.42.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.42.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + 
"model.layers.84.mlp.experts.42.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.42.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.43.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.43.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.43.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.43.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.43.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.43.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.44.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.44.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.44.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.44.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.44.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.44.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.45.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.45.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.45.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.45.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.45.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.45.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.46.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.46.down_proj.weight_scale": 
"model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.46.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.46.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.46.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.46.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.47.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.47.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.47.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.47.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.47.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.47.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.48.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.48.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.48.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.48.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.48.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.48.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.49.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.49.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.49.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.49.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.49.up_proj.weight": "model-00085-of-00092.safetensors", + 
"model.layers.84.mlp.experts.49.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.5.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.5.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.5.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.5.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.5.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.5.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.50.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.50.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.50.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.50.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.50.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.50.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.51.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.51.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.51.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.51.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.51.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.51.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.52.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.52.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.52.gate_proj.weight": 
"model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.52.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.52.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.52.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.53.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.53.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.53.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.53.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.53.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.53.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.54.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.54.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.54.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.54.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.54.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.54.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.55.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.55.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.55.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.55.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.55.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.55.up_proj.weight_scale": "model-00085-of-00092.safetensors", + 
"model.layers.84.mlp.experts.56.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.56.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.56.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.56.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.56.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.56.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.57.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.57.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.57.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.57.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.57.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.57.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.58.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.58.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.58.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.58.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.58.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.58.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.59.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.59.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.59.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.59.gate_proj.weight_scale": 
"model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.59.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.59.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.6.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.6.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.6.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.6.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.6.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.6.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.60.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.60.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.60.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.60.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.60.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.60.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.61.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.61.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.61.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.61.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.61.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.61.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.62.down_proj.weight": "model-00085-of-00092.safetensors", + 
"model.layers.84.mlp.experts.62.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.62.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.62.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.62.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.62.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.63.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.63.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.63.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.63.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.63.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.63.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.64.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.64.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.64.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.64.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.64.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.64.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.65.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.65.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.65.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.65.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.65.up_proj.weight": 
"model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.65.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.66.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.66.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.66.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.66.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.66.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.66.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.67.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.67.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.67.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.67.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.67.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.67.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.68.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.68.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.68.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.68.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.68.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.68.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.69.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.69.down_proj.weight_scale": "model-00085-of-00092.safetensors", + 
"model.layers.84.mlp.experts.69.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.69.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.69.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.69.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.7.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.7.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.7.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.7.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.7.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.7.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.70.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.70.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.70.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.70.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.70.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.70.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.71.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.71.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.71.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.71.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.71.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.71.up_proj.weight_scale": "model-00085-of-00092.safetensors", 
+ "model.layers.84.mlp.experts.72.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.72.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.72.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.72.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.72.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.72.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.73.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.73.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.73.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.73.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.73.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.73.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.74.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.74.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.74.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.74.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.74.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.74.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.75.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.75.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.75.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.75.gate_proj.weight_scale": 
"model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.75.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.75.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.76.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.76.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.76.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.76.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.76.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.76.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.77.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.77.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.77.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.77.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.77.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.77.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.78.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.78.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.78.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.78.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.78.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.78.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.79.down_proj.weight": "model-00085-of-00092.safetensors", + 
"model.layers.84.mlp.experts.79.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.79.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.79.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.79.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.79.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.8.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.8.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.8.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.8.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.8.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.8.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.80.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.80.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.80.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.80.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.80.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.80.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.81.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.81.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.81.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.81.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.81.up_proj.weight": 
"model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.81.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.82.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.82.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.82.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.82.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.82.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.82.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.83.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.83.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.83.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.83.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.83.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.83.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.84.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.84.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.84.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.84.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.84.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.84.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.85.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.85.down_proj.weight_scale": "model-00085-of-00092.safetensors", + 
"model.layers.84.mlp.experts.85.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.85.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.85.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.85.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.86.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.86.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.86.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.86.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.86.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.86.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.87.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.87.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.87.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.87.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.87.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.87.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.88.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.88.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.88.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.88.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.88.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.88.up_proj.weight_scale": 
"model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.89.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.89.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.89.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.89.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.89.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.89.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.9.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.9.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.9.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.9.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.9.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.9.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.90.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.90.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.90.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.90.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.90.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.90.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.91.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.91.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.91.gate_proj.weight": "model-00085-of-00092.safetensors", + 
"model.layers.84.mlp.experts.91.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.91.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.91.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.92.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.92.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.92.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.92.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.92.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.92.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.93.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.93.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.93.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.93.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.93.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.93.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.94.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.94.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.94.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.94.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.94.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.94.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.95.down_proj.weight": 
"model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.95.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.95.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.95.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.95.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.95.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.96.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.96.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.96.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.96.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.96.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.96.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.97.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.97.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.97.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.97.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.97.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.97.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.98.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.98.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.98.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.98.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + 
"model.layers.84.mlp.experts.98.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.98.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.99.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.99.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.99.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.99.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.99.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.experts.99.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.gate.e_score_correction_bias": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.gate.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.shared_experts.down_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.shared_experts.down_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.shared_experts.gate_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.shared_experts.gate_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.shared_experts.up_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.mlp.shared_experts.up_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.post_attention_layernorm.weight": "model-00085-of-00092.safetensors", + "model.layers.84.self_attn.k_norm.weight": "model-00085-of-00092.safetensors", + "model.layers.84.self_attn.k_proj.bias": "model-00085-of-00092.safetensors", + "model.layers.84.self_attn.k_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.self_attn.k_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.self_attn.o_proj.weight": "model-00085-of-00092.safetensors", + 
"model.layers.84.self_attn.o_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.self_attn.q_norm.weight": "model-00085-of-00092.safetensors", + "model.layers.84.self_attn.q_proj.bias": "model-00085-of-00092.safetensors", + "model.layers.84.self_attn.q_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.self_attn.q_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.84.self_attn.v_proj.bias": "model-00085-of-00092.safetensors", + "model.layers.84.self_attn.v_proj.weight": "model-00085-of-00092.safetensors", + "model.layers.84.self_attn.v_proj.weight_scale": "model-00085-of-00092.safetensors", + "model.layers.85.input_layernorm.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.0.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.0.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.0.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.0.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.0.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.0.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.1.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.1.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.1.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.1.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.1.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.1.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.10.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.10.down_proj.weight_scale": 
"model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.10.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.10.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.10.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.10.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.100.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.100.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.100.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.100.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.100.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.100.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.101.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.101.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.101.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.101.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.101.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.101.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.102.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.102.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.102.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.102.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.102.up_proj.weight": "model-00086-of-00092.safetensors", + 
"model.layers.85.mlp.experts.102.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.103.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.103.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.103.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.103.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.103.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.103.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.104.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.104.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.104.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.104.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.104.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.104.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.105.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.105.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.105.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.105.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.105.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.105.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.106.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.106.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.106.gate_proj.weight": 
"model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.106.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.106.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.106.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.107.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.107.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.107.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.107.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.107.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.107.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.108.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.108.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.108.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.108.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.108.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.108.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.109.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.109.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.109.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.109.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.109.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.109.up_proj.weight_scale": "model-00086-of-00092.safetensors", + 
"model.layers.85.mlp.experts.11.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.11.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.11.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.11.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.11.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.11.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.110.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.110.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.110.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.110.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.110.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.110.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.111.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.111.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.111.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.111.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.111.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.111.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.112.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.112.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.112.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.112.gate_proj.weight_scale": 
"model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.112.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.112.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.113.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.113.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.113.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.113.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.113.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.113.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.114.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.114.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.114.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.114.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.114.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.114.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.115.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.115.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.115.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.115.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.115.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.115.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.116.down_proj.weight": "model-00086-of-00092.safetensors", + 
"model.layers.85.mlp.experts.116.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.116.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.116.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.116.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.116.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.117.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.117.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.117.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.117.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.117.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.117.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.118.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.118.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.118.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.118.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.118.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.118.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.119.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.119.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.119.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.119.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.119.up_proj.weight": 
"model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.119.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.12.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.12.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.12.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.12.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.12.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.12.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.120.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.120.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.120.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.120.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.120.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.120.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.121.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.121.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.121.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.121.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.121.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.121.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.122.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.122.down_proj.weight_scale": "model-00086-of-00092.safetensors", + 
"model.layers.85.mlp.experts.122.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.122.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.122.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.122.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.123.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.123.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.123.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.123.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.123.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.123.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.124.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.124.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.124.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.124.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.124.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.124.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.125.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.125.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.125.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.125.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.125.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.125.up_proj.weight_scale": 
"model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.126.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.126.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.126.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.126.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.126.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.126.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.127.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.127.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.127.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.127.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.127.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.127.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.128.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.128.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.128.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.128.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.128.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.128.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.129.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.129.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.129.gate_proj.weight": "model-00086-of-00092.safetensors", + 
"model.layers.85.mlp.experts.129.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.129.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.129.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.13.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.13.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.13.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.13.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.13.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.13.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.130.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.130.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.130.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.130.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.130.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.130.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.131.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.131.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.131.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.131.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.131.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.131.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.132.down_proj.weight": 
"model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.132.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.132.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.132.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.132.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.132.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.133.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.133.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.133.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.133.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.133.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.133.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.134.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.134.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.134.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.134.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.134.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.134.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.135.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.135.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.135.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.135.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + 
"model.layers.85.mlp.experts.135.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.135.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.136.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.136.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.136.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.136.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.136.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.136.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.137.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.137.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.137.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.137.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.137.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.137.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.138.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.138.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.138.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.138.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.138.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.138.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.139.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.139.down_proj.weight_scale": 
"model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.139.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.139.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.139.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.139.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.14.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.14.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.14.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.14.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.14.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.14.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.140.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.140.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.140.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.140.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.140.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.140.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.141.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.141.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.141.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.141.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.141.up_proj.weight": "model-00086-of-00092.safetensors", + 
"model.layers.85.mlp.experts.141.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.142.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.142.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.142.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.142.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.142.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.142.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.143.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.143.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.143.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.143.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.143.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.143.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.144.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.144.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.144.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.144.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.144.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.144.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.145.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.145.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.145.gate_proj.weight": 
"model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.145.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.145.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.145.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.146.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.146.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.146.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.146.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.146.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.146.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.147.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.147.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.147.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.147.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.147.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.147.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.148.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.148.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.148.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.148.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.148.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.148.up_proj.weight_scale": "model-00086-of-00092.safetensors", + 
"model.layers.85.mlp.experts.149.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.149.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.149.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.149.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.149.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.149.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.15.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.15.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.15.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.15.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.15.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.15.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.150.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.150.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.150.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.150.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.150.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.150.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.151.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.151.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.151.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.151.gate_proj.weight_scale": 
"model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.151.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.151.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.152.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.152.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.152.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.152.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.152.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.152.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.153.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.153.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.153.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.153.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.153.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.153.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.154.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.154.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.154.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.154.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.154.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.154.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.155.down_proj.weight": "model-00086-of-00092.safetensors", + 
"model.layers.85.mlp.experts.155.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.155.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.155.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.155.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.155.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.156.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.156.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.156.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.156.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.156.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.156.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.157.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.157.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.157.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.157.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.157.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.157.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.158.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.158.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.158.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.158.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.158.up_proj.weight": 
"model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.158.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.159.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.159.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.159.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.159.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.159.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.159.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.16.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.16.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.16.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.16.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.16.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.16.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.17.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.17.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.17.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.17.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.17.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.17.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.18.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.18.down_proj.weight_scale": "model-00086-of-00092.safetensors", + 
"model.layers.85.mlp.experts.18.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.18.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.18.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.18.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.19.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.19.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.19.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.19.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.19.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.19.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.2.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.2.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.2.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.2.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.2.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.2.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.20.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.20.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.20.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.20.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.20.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.20.up_proj.weight_scale": "model-00086-of-00092.safetensors", 
+ "model.layers.85.mlp.experts.21.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.21.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.21.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.21.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.21.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.21.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.22.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.22.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.22.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.22.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.22.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.22.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.23.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.23.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.23.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.23.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.23.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.23.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.24.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.24.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.24.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.24.gate_proj.weight_scale": 
"model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.24.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.24.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.25.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.25.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.25.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.25.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.25.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.25.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.26.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.26.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.26.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.26.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.26.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.26.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.27.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.27.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.27.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.27.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.27.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.27.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.28.down_proj.weight": "model-00086-of-00092.safetensors", + 
"model.layers.85.mlp.experts.28.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.28.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.28.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.28.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.28.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.29.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.29.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.29.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.29.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.29.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.29.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.3.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.3.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.3.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.3.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.3.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.3.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.30.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.30.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.30.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.30.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.30.up_proj.weight": 
"model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.30.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.31.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.31.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.31.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.31.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.31.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.31.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.32.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.32.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.32.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.32.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.32.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.32.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.33.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.33.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.33.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.33.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.33.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.33.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.34.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.34.down_proj.weight_scale": "model-00086-of-00092.safetensors", + 
"model.layers.85.mlp.experts.34.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.34.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.34.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.34.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.35.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.35.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.35.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.35.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.35.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.35.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.36.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.36.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.36.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.36.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.36.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.36.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.37.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.37.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.37.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.37.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.37.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.37.up_proj.weight_scale": 
"model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.38.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.38.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.38.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.38.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.38.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.38.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.39.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.39.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.39.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.39.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.39.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.39.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.4.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.4.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.4.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.4.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.4.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.4.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.40.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.40.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.40.gate_proj.weight": "model-00086-of-00092.safetensors", + 
"model.layers.85.mlp.experts.40.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.40.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.40.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.41.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.41.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.41.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.41.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.41.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.41.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.42.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.42.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.42.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.42.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.42.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.42.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.43.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.43.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.43.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.43.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.43.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.43.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.44.down_proj.weight": 
"model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.44.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.44.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.44.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.44.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.44.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.45.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.45.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.45.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.45.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.45.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.45.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.46.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.46.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.46.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.46.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.46.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.46.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.47.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.47.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.47.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.47.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + 
"model.layers.85.mlp.experts.47.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.47.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.48.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.48.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.48.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.48.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.48.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.48.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.49.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.49.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.49.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.49.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.49.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.49.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.5.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.5.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.5.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.5.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.5.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.5.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.50.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.50.down_proj.weight_scale": "model-00086-of-00092.safetensors", 
+ "model.layers.85.mlp.experts.50.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.50.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.50.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.50.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.51.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.51.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.51.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.51.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.51.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.51.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.52.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.52.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.52.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.52.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.52.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.52.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.53.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.53.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.53.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.53.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.53.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.53.up_proj.weight_scale": 
"model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.54.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.54.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.54.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.54.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.54.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.54.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.55.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.55.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.55.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.55.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.55.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.55.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.56.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.56.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.56.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.56.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.56.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.56.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.57.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.57.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.57.gate_proj.weight": "model-00086-of-00092.safetensors", + 
"model.layers.85.mlp.experts.57.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.57.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.57.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.58.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.58.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.58.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.58.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.58.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.58.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.59.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.59.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.59.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.59.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.59.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.59.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.6.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.6.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.6.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.6.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.6.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.6.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.60.down_proj.weight": "model-00086-of-00092.safetensors", 
+ "model.layers.85.mlp.experts.60.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.60.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.60.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.60.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.60.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.61.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.61.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.61.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.61.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.61.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.61.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.62.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.62.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.62.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.62.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.62.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.62.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.63.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.63.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.63.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.63.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.63.up_proj.weight": 
"model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.63.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.64.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.64.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.64.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.64.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.64.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.64.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.65.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.65.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.65.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.65.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.65.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.65.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.66.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.66.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.66.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.66.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.66.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.66.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.67.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.67.down_proj.weight_scale": "model-00086-of-00092.safetensors", + 
"model.layers.85.mlp.experts.67.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.67.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.67.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.67.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.68.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.68.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.68.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.68.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.68.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.68.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.69.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.69.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.69.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.69.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.69.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.69.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.7.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.7.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.7.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.7.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.7.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.7.up_proj.weight_scale": "model-00086-of-00092.safetensors", 
+ "model.layers.85.mlp.experts.70.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.70.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.70.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.70.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.70.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.70.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.71.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.71.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.71.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.71.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.71.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.71.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.72.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.72.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.72.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.72.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.72.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.72.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.73.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.73.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.73.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.73.gate_proj.weight_scale": 
"model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.73.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.73.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.74.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.74.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.74.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.74.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.74.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.74.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.75.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.75.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.75.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.75.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.75.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.75.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.76.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.76.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.76.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.76.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.76.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.76.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.77.down_proj.weight": "model-00086-of-00092.safetensors", + 
"model.layers.85.mlp.experts.77.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.77.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.77.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.77.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.77.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.78.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.78.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.78.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.78.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.78.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.78.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.79.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.79.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.79.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.79.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.79.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.79.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.8.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.8.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.8.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.8.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.8.up_proj.weight": 
"model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.8.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.80.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.80.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.80.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.80.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.80.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.80.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.81.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.81.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.81.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.81.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.81.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.81.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.82.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.82.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.82.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.82.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.82.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.82.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.83.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.83.down_proj.weight_scale": "model-00086-of-00092.safetensors", + 
"model.layers.85.mlp.experts.83.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.83.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.83.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.83.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.84.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.84.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.84.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.84.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.84.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.84.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.85.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.85.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.85.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.85.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.85.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.85.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.86.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.86.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.86.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.86.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.86.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.86.up_proj.weight_scale": 
"model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.87.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.87.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.87.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.87.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.87.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.87.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.88.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.88.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.88.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.88.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.88.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.88.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.89.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.89.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.89.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.89.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.89.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.89.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.9.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.9.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.9.gate_proj.weight": "model-00086-of-00092.safetensors", + 
"model.layers.85.mlp.experts.9.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.9.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.9.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.90.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.90.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.90.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.90.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.90.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.90.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.91.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.91.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.91.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.91.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.91.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.91.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.92.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.92.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.92.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.92.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.92.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.92.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.93.down_proj.weight": 
"model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.93.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.93.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.93.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.93.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.93.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.94.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.94.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.94.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.94.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.94.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.94.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.95.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.95.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.95.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.95.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.95.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.95.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.96.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.96.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.96.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.96.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + 
"model.layers.85.mlp.experts.96.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.96.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.97.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.97.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.97.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.97.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.97.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.97.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.98.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.98.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.98.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.98.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.98.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.98.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.99.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.99.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.99.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.99.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.99.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.experts.99.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.gate.e_score_correction_bias": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.gate.weight": "model-00086-of-00092.safetensors", + 
"model.layers.85.mlp.shared_experts.down_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.shared_experts.down_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.shared_experts.gate_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.shared_experts.gate_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.shared_experts.up_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.mlp.shared_experts.up_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.post_attention_layernorm.weight": "model-00086-of-00092.safetensors", + "model.layers.85.self_attn.k_norm.weight": "model-00086-of-00092.safetensors", + "model.layers.85.self_attn.k_proj.bias": "model-00086-of-00092.safetensors", + "model.layers.85.self_attn.k_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.self_attn.k_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.self_attn.o_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.self_attn.o_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.self_attn.q_norm.weight": "model-00086-of-00092.safetensors", + "model.layers.85.self_attn.q_proj.bias": "model-00086-of-00092.safetensors", + "model.layers.85.self_attn.q_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.self_attn.q_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.85.self_attn.v_proj.bias": "model-00086-of-00092.safetensors", + "model.layers.85.self_attn.v_proj.weight": "model-00086-of-00092.safetensors", + "model.layers.85.self_attn.v_proj.weight_scale": "model-00086-of-00092.safetensors", + "model.layers.86.input_layernorm.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.0.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.0.down_proj.weight_scale": "model-00087-of-00092.safetensors", + 
"model.layers.86.mlp.experts.0.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.0.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.0.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.0.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.1.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.1.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.1.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.1.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.1.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.1.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.10.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.10.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.10.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.10.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.10.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.10.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.100.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.100.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.100.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.100.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.100.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.100.up_proj.weight_scale": 
"model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.101.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.101.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.101.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.101.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.101.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.101.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.102.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.102.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.102.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.102.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.102.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.102.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.103.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.103.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.103.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.103.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.103.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.103.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.104.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.104.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.104.gate_proj.weight": "model-00087-of-00092.safetensors", + 
"model.layers.86.mlp.experts.104.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.104.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.104.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.105.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.105.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.105.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.105.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.105.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.105.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.106.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.106.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.106.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.106.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.106.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.106.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.107.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.107.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.107.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.107.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.107.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.107.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.108.down_proj.weight": 
"model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.108.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.108.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.108.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.108.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.108.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.109.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.109.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.109.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.109.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.109.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.109.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.11.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.11.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.11.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.11.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.11.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.11.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.110.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.110.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.110.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.110.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + 
"model.layers.86.mlp.experts.110.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.110.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.111.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.111.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.111.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.111.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.111.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.111.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.112.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.112.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.112.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.112.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.112.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.112.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.113.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.113.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.113.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.113.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.113.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.113.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.114.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.114.down_proj.weight_scale": 
"model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.114.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.114.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.114.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.114.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.115.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.115.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.115.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.115.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.115.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.115.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.116.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.116.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.116.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.116.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.116.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.116.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.117.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.117.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.117.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.117.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.117.up_proj.weight": "model-00087-of-00092.safetensors", + 
"model.layers.86.mlp.experts.117.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.118.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.118.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.118.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.118.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.118.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.118.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.119.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.119.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.119.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.119.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.119.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.119.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.12.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.12.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.12.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.12.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.12.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.12.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.120.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.120.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.120.gate_proj.weight": 
"model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.120.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.120.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.120.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.121.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.121.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.121.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.121.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.121.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.121.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.122.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.122.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.122.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.122.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.122.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.122.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.123.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.123.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.123.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.123.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.123.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.123.up_proj.weight_scale": "model-00087-of-00092.safetensors", + 
"model.layers.86.mlp.experts.124.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.124.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.124.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.124.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.124.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.124.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.125.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.125.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.125.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.125.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.125.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.125.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.126.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.126.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.126.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.126.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.126.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.126.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.127.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.127.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.127.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.127.gate_proj.weight_scale": 
"model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.127.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.127.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.128.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.128.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.128.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.128.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.128.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.128.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.129.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.129.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.129.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.129.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.129.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.129.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.13.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.13.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.13.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.13.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.13.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.13.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.130.down_proj.weight": "model-00087-of-00092.safetensors", + 
"model.layers.86.mlp.experts.130.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.130.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.130.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.130.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.130.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.131.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.131.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.131.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.131.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.131.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.131.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.132.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.132.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.132.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.132.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.132.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.132.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.133.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.133.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.133.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.133.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.133.up_proj.weight": 
"model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.133.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.134.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.134.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.134.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.134.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.134.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.134.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.135.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.135.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.135.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.135.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.135.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.135.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.136.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.136.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.136.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.136.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.136.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.136.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.137.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.137.down_proj.weight_scale": "model-00087-of-00092.safetensors", + 
"model.layers.86.mlp.experts.137.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.137.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.137.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.137.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.138.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.138.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.138.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.138.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.138.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.138.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.139.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.139.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.139.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.139.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.139.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.139.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.14.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.14.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.14.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.14.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.14.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.14.up_proj.weight_scale": 
"model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.140.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.140.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.140.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.140.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.140.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.140.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.141.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.141.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.141.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.141.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.141.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.141.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.142.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.142.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.142.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.142.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.142.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.142.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.143.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.143.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.143.gate_proj.weight": "model-00087-of-00092.safetensors", + 
"model.layers.86.mlp.experts.143.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.143.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.143.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.144.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.144.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.144.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.144.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.144.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.144.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.145.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.145.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.145.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.145.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.145.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.145.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.146.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.146.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.146.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.146.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.146.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.146.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.147.down_proj.weight": 
"model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.147.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.147.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.147.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.147.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.147.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.148.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.148.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.148.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.148.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.148.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.148.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.149.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.149.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.149.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.149.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.149.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.149.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.15.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.15.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.15.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.15.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + 
"model.layers.86.mlp.experts.15.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.15.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.150.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.150.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.150.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.150.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.150.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.150.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.151.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.151.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.151.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.151.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.151.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.151.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.152.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.152.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.152.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.152.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.152.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.152.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.153.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.153.down_proj.weight_scale": 
"model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.153.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.153.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.153.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.153.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.154.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.154.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.154.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.154.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.154.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.154.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.155.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.155.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.155.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.155.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.155.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.155.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.156.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.156.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.156.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.156.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.156.up_proj.weight": "model-00087-of-00092.safetensors", + 
"model.layers.86.mlp.experts.156.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.157.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.157.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.157.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.157.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.157.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.157.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.158.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.158.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.158.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.158.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.158.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.158.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.159.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.159.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.159.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.159.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.159.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.159.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.16.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.16.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.16.gate_proj.weight": 
"model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.16.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.16.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.16.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.17.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.17.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.17.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.17.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.17.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.17.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.18.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.18.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.18.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.18.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.18.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.18.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.19.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.19.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.19.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.19.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.19.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.19.up_proj.weight_scale": "model-00087-of-00092.safetensors", + 
"model.layers.86.mlp.experts.2.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.2.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.2.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.2.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.2.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.2.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.20.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.20.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.20.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.20.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.20.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.20.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.21.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.21.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.21.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.21.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.21.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.21.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.22.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.22.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.22.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.22.gate_proj.weight_scale": 
"model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.22.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.22.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.23.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.23.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.23.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.23.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.23.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.23.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.24.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.24.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.24.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.24.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.24.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.24.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.25.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.25.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.25.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.25.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.25.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.25.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.26.down_proj.weight": "model-00087-of-00092.safetensors", + 
"model.layers.86.mlp.experts.26.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.26.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.26.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.26.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.26.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.27.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.27.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.27.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.27.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.27.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.27.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.28.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.28.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.28.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.28.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.28.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.28.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.29.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.29.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.29.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.29.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.29.up_proj.weight": 
"model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.29.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.3.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.3.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.3.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.3.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.3.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.3.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.30.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.30.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.30.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.30.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.30.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.30.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.31.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.31.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.31.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.31.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.31.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.31.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.32.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.32.down_proj.weight_scale": "model-00087-of-00092.safetensors", + 
"model.layers.86.mlp.experts.32.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.32.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.32.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.32.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.33.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.33.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.33.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.33.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.33.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.33.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.34.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.34.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.34.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.34.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.34.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.34.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.35.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.35.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.35.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.35.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.35.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.35.up_proj.weight_scale": 
"model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.36.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.36.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.36.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.36.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.36.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.36.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.37.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.37.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.37.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.37.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.37.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.37.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.38.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.38.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.38.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.38.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.38.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.38.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.39.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.39.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.39.gate_proj.weight": "model-00087-of-00092.safetensors", + 
"model.layers.86.mlp.experts.39.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.39.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.39.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.4.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.4.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.4.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.4.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.4.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.4.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.40.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.40.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.40.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.40.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.40.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.40.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.41.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.41.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.41.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.41.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.41.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.41.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.42.down_proj.weight": "model-00087-of-00092.safetensors", 
+ "model.layers.86.mlp.experts.42.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.42.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.42.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.42.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.42.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.43.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.43.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.43.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.43.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.43.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.43.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.44.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.44.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.44.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.44.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.44.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.44.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.45.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.45.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.45.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.45.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.45.up_proj.weight": 
"model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.45.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.46.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.46.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.46.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.46.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.46.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.46.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.47.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.47.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.47.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.47.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.47.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.47.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.48.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.48.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.48.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.48.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.48.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.48.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.49.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.49.down_proj.weight_scale": "model-00087-of-00092.safetensors", + 
"model.layers.86.mlp.experts.49.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.49.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.49.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.49.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.5.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.5.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.5.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.5.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.5.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.5.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.50.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.50.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.50.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.50.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.50.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.50.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.51.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.51.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.51.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.51.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.51.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.51.up_proj.weight_scale": "model-00087-of-00092.safetensors", 
+ "model.layers.86.mlp.experts.52.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.52.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.52.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.52.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.52.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.52.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.53.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.53.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.53.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.53.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.53.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.53.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.54.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.54.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.54.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.54.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.54.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.54.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.55.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.55.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.55.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.55.gate_proj.weight_scale": 
"model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.55.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.55.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.56.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.56.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.56.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.56.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.56.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.56.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.57.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.57.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.57.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.57.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.57.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.57.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.58.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.58.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.58.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.58.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.58.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.58.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.59.down_proj.weight": "model-00087-of-00092.safetensors", + 
"model.layers.86.mlp.experts.59.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.59.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.59.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.59.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.59.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.6.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.6.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.6.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.6.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.6.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.6.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.60.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.60.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.60.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.60.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.60.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.60.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.61.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.61.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.61.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.61.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.61.up_proj.weight": 
"model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.61.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.62.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.62.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.62.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.62.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.62.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.62.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.63.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.63.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.63.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.63.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.63.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.63.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.64.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.64.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.64.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.64.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.64.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.64.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.65.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.65.down_proj.weight_scale": "model-00087-of-00092.safetensors", + 
"model.layers.86.mlp.experts.65.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.65.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.65.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.65.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.66.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.66.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.66.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.66.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.66.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.66.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.67.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.67.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.67.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.67.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.67.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.67.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.68.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.68.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.68.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.68.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.68.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.68.up_proj.weight_scale": 
"model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.69.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.69.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.69.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.69.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.69.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.69.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.7.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.7.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.7.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.7.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.7.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.7.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.70.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.70.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.70.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.70.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.70.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.70.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.71.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.71.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.71.gate_proj.weight": "model-00087-of-00092.safetensors", + 
"model.layers.86.mlp.experts.71.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.71.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.71.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.72.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.72.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.72.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.72.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.72.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.72.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.73.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.73.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.73.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.73.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.73.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.73.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.74.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.74.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.74.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.74.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.74.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.74.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.75.down_proj.weight": 
"model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.75.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.75.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.75.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.75.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.75.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.76.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.76.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.76.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.76.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.76.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.76.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.77.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.77.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.77.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.77.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.77.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.77.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.78.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.78.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.78.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.78.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + 
"model.layers.86.mlp.experts.78.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.78.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.79.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.79.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.79.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.79.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.79.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.79.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.8.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.8.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.8.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.8.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.8.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.8.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.80.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.80.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.80.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.80.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.80.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.80.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.81.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.81.down_proj.weight_scale": "model-00087-of-00092.safetensors", 
+ "model.layers.86.mlp.experts.81.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.81.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.81.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.81.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.82.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.82.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.82.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.82.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.82.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.82.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.83.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.83.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.83.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.83.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.83.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.83.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.84.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.84.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.84.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.84.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.84.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.84.up_proj.weight_scale": 
"model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.85.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.85.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.85.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.85.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.85.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.85.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.86.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.86.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.86.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.86.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.86.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.86.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.87.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.87.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.87.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.87.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.87.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.87.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.88.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.88.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.88.gate_proj.weight": "model-00087-of-00092.safetensors", + 
"model.layers.86.mlp.experts.88.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.88.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.88.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.89.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.89.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.89.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.89.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.89.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.89.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.9.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.9.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.9.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.9.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.9.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.9.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.90.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.90.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.90.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.90.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.90.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.90.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.91.down_proj.weight": "model-00087-of-00092.safetensors", 
+ "model.layers.86.mlp.experts.91.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.91.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.91.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.91.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.91.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.92.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.92.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.92.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.92.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.92.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.92.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.93.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.93.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.93.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.93.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.93.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.93.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.94.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.94.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.94.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.94.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.94.up_proj.weight": 
"model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.94.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.95.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.95.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.95.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.95.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.95.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.95.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.96.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.96.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.96.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.96.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.96.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.96.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.97.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.97.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.97.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.97.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.97.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.97.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.98.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.98.down_proj.weight_scale": "model-00087-of-00092.safetensors", + 
"model.layers.86.mlp.experts.98.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.98.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.98.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.98.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.99.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.99.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.99.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.99.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.99.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.experts.99.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.gate.e_score_correction_bias": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.gate.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.shared_experts.down_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.shared_experts.down_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.shared_experts.gate_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.shared_experts.gate_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.shared_experts.up_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.mlp.shared_experts.up_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.post_attention_layernorm.weight": "model-00087-of-00092.safetensors", + "model.layers.86.self_attn.k_norm.weight": "model-00087-of-00092.safetensors", + "model.layers.86.self_attn.k_proj.bias": "model-00087-of-00092.safetensors", + "model.layers.86.self_attn.k_proj.weight": "model-00087-of-00092.safetensors", + 
"model.layers.86.self_attn.k_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.self_attn.o_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.self_attn.o_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.self_attn.q_norm.weight": "model-00087-of-00092.safetensors", + "model.layers.86.self_attn.q_proj.bias": "model-00087-of-00092.safetensors", + "model.layers.86.self_attn.q_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.self_attn.q_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.86.self_attn.v_proj.bias": "model-00087-of-00092.safetensors", + "model.layers.86.self_attn.v_proj.weight": "model-00087-of-00092.safetensors", + "model.layers.86.self_attn.v_proj.weight_scale": "model-00087-of-00092.safetensors", + "model.layers.87.input_layernorm.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.0.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.0.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.0.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.0.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.0.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.0.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.1.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.1.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.1.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.1.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.1.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.1.up_proj.weight_scale": "model-00088-of-00092.safetensors", + 
"model.layers.87.mlp.experts.10.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.10.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.10.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.10.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.10.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.10.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.100.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.100.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.100.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.100.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.100.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.100.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.101.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.101.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.101.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.101.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.101.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.101.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.102.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.102.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.102.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.102.gate_proj.weight_scale": 
"model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.102.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.102.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.103.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.103.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.103.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.103.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.103.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.103.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.104.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.104.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.104.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.104.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.104.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.104.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.105.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.105.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.105.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.105.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.105.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.105.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.106.down_proj.weight": "model-00088-of-00092.safetensors", + 
"model.layers.87.mlp.experts.106.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.106.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.106.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.106.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.106.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.107.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.107.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.107.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.107.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.107.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.107.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.108.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.108.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.108.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.108.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.108.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.108.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.109.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.109.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.109.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.109.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.109.up_proj.weight": 
"model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.109.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.11.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.11.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.11.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.11.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.11.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.11.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.110.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.110.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.110.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.110.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.110.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.110.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.111.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.111.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.111.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.111.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.111.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.111.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.112.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.112.down_proj.weight_scale": "model-00088-of-00092.safetensors", + 
"model.layers.87.mlp.experts.112.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.112.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.112.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.112.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.113.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.113.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.113.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.113.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.113.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.113.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.114.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.114.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.114.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.114.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.114.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.114.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.115.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.115.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.115.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.115.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.115.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.115.up_proj.weight_scale": 
"model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.116.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.116.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.116.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.116.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.116.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.116.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.117.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.117.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.117.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.117.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.117.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.117.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.118.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.118.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.118.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.118.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.118.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.118.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.119.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.119.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.119.gate_proj.weight": "model-00088-of-00092.safetensors", + 
"model.layers.87.mlp.experts.119.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.119.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.119.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.12.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.12.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.12.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.12.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.12.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.12.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.120.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.120.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.120.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.120.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.120.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.120.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.121.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.121.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.121.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.121.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.121.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.121.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.122.down_proj.weight": 
"model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.122.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.122.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.122.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.122.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.122.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.123.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.123.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.123.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.123.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.123.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.123.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.124.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.124.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.124.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.124.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.124.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.124.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.125.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.125.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.125.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.125.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + 
"model.layers.87.mlp.experts.125.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.125.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.126.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.126.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.126.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.126.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.126.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.126.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.127.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.127.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.127.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.127.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.127.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.127.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.128.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.128.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.128.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.128.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.128.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.128.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.129.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.129.down_proj.weight_scale": 
"model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.129.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.129.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.129.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.129.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.13.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.13.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.13.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.13.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.13.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.13.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.130.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.130.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.130.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.130.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.130.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.130.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.131.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.131.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.131.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.131.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.131.up_proj.weight": "model-00088-of-00092.safetensors", + 
"model.layers.87.mlp.experts.131.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.132.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.132.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.132.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.132.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.132.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.132.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.133.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.133.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.133.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.133.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.133.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.133.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.134.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.134.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.134.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.134.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.134.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.134.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.135.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.135.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.135.gate_proj.weight": 
"model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.135.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.135.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.135.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.136.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.136.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.136.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.136.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.136.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.136.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.137.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.137.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.137.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.137.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.137.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.137.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.138.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.138.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.138.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.138.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.138.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.138.up_proj.weight_scale": "model-00088-of-00092.safetensors", + 
"model.layers.87.mlp.experts.139.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.139.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.139.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.139.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.139.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.139.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.14.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.14.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.14.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.14.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.14.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.14.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.140.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.140.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.140.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.140.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.140.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.140.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.141.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.141.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.141.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.141.gate_proj.weight_scale": 
"model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.141.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.141.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.142.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.142.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.142.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.142.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.142.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.142.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.143.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.143.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.143.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.143.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.143.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.143.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.144.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.144.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.144.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.144.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.144.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.144.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.145.down_proj.weight": "model-00088-of-00092.safetensors", + 
"model.layers.87.mlp.experts.145.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.145.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.145.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.145.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.145.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.146.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.146.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.146.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.146.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.146.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.146.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.147.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.147.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.147.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.147.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.147.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.147.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.148.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.148.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.148.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.148.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.148.up_proj.weight": 
"model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.148.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.149.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.149.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.149.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.149.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.149.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.149.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.15.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.15.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.15.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.15.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.15.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.15.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.150.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.150.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.150.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.150.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.150.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.150.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.151.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.151.down_proj.weight_scale": "model-00088-of-00092.safetensors", + 
"model.layers.87.mlp.experts.151.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.151.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.151.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.151.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.152.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.152.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.152.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.152.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.152.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.152.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.153.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.153.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.153.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.153.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.153.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.153.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.154.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.154.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.154.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.154.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.154.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.154.up_proj.weight_scale": 
"model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.155.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.155.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.155.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.155.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.155.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.155.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.156.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.156.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.156.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.156.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.156.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.156.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.157.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.157.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.157.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.157.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.157.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.157.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.158.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.158.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.158.gate_proj.weight": "model-00088-of-00092.safetensors", + 
"model.layers.87.mlp.experts.158.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.158.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.158.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.159.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.159.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.159.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.159.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.159.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.159.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.16.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.16.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.16.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.16.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.16.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.16.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.17.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.17.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.17.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.17.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.17.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.17.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.18.down_proj.weight": 
"model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.18.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.18.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.18.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.18.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.18.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.19.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.19.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.19.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.19.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.19.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.19.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.2.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.2.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.2.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.2.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.2.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.2.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.20.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.20.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.20.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.20.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + 
"model.layers.87.mlp.experts.20.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.20.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.21.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.21.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.21.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.21.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.21.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.21.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.22.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.22.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.22.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.22.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.22.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.22.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.23.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.23.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.23.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.23.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.23.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.23.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.24.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.24.down_proj.weight_scale": 
"model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.24.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.24.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.24.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.24.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.25.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.25.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.25.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.25.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.25.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.25.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.26.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.26.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.26.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.26.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.26.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.26.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.27.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.27.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.27.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.27.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.27.up_proj.weight": "model-00088-of-00092.safetensors", + 
"model.layers.87.mlp.experts.27.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.28.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.28.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.28.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.28.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.28.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.28.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.29.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.29.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.29.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.29.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.29.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.29.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.3.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.3.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.3.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.3.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.3.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.3.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.30.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.30.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.30.gate_proj.weight": 
"model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.30.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.30.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.30.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.31.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.31.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.31.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.31.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.31.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.31.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.32.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.32.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.32.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.32.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.32.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.32.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.33.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.33.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.33.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.33.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.33.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.33.up_proj.weight_scale": "model-00088-of-00092.safetensors", + 
"model.layers.87.mlp.experts.34.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.34.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.34.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.34.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.34.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.34.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.35.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.35.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.35.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.35.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.35.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.35.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.36.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.36.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.36.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.36.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.36.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.36.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.37.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.37.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.37.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.37.gate_proj.weight_scale": 
"model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.37.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.37.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.38.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.38.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.38.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.38.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.38.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.38.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.39.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.39.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.39.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.39.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.39.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.39.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.4.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.4.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.4.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.4.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.4.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.4.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.40.down_proj.weight": "model-00088-of-00092.safetensors", + 
"model.layers.87.mlp.experts.40.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.40.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.40.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.40.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.40.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.41.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.41.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.41.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.41.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.41.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.41.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.42.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.42.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.42.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.42.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.42.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.42.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.43.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.43.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.43.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.43.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.43.up_proj.weight": 
"model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.43.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.44.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.44.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.44.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.44.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.44.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.44.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.45.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.45.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.45.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.45.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.45.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.45.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.46.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.46.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.46.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.46.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.46.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.46.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.47.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.47.down_proj.weight_scale": "model-00088-of-00092.safetensors", + 
"model.layers.87.mlp.experts.47.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.47.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.47.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.47.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.48.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.48.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.48.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.48.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.48.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.48.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.49.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.49.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.49.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.49.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.49.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.49.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.5.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.5.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.5.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.5.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.5.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.5.up_proj.weight_scale": "model-00088-of-00092.safetensors", 
+ "model.layers.87.mlp.experts.50.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.50.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.50.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.50.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.50.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.50.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.51.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.51.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.51.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.51.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.51.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.51.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.52.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.52.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.52.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.52.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.52.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.52.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.53.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.53.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.53.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.53.gate_proj.weight_scale": 
"model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.53.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.53.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.54.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.54.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.54.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.54.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.54.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.54.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.55.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.55.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.55.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.55.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.55.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.55.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.56.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.56.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.56.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.56.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.56.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.56.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.57.down_proj.weight": "model-00088-of-00092.safetensors", + 
"model.layers.87.mlp.experts.57.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.57.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.57.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.57.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.57.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.58.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.58.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.58.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.58.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.58.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.58.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.59.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.59.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.59.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.59.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.59.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.59.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.6.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.6.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.6.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.6.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.6.up_proj.weight": 
"model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.6.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.60.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.60.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.60.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.60.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.60.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.60.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.61.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.61.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.61.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.61.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.61.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.61.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.62.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.62.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.62.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.62.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.62.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.62.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.63.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.63.down_proj.weight_scale": "model-00088-of-00092.safetensors", + 
"model.layers.87.mlp.experts.63.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.63.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.63.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.63.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.64.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.64.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.64.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.64.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.64.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.64.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.65.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.65.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.65.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.65.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.65.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.65.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.66.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.66.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.66.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.66.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.66.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.66.up_proj.weight_scale": 
"model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.67.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.67.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.67.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.67.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.67.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.67.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.68.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.68.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.68.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.68.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.68.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.68.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.69.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.69.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.69.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.69.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.69.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.69.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.7.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.7.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.7.gate_proj.weight": "model-00088-of-00092.safetensors", + 
"model.layers.87.mlp.experts.7.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.7.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.7.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.70.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.70.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.70.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.70.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.70.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.70.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.71.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.71.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.71.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.71.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.71.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.71.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.72.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.72.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.72.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.72.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.72.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.72.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.73.down_proj.weight": 
"model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.73.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.73.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.73.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.73.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.73.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.74.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.74.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.74.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.74.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.74.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.74.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.75.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.75.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.75.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.75.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.75.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.75.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.76.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.76.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.76.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.76.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + 
"model.layers.87.mlp.experts.76.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.76.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.77.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.77.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.77.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.77.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.77.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.77.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.78.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.78.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.78.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.78.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.78.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.78.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.79.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.79.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.79.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.79.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.79.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.79.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.8.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.8.down_proj.weight_scale": 
"model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.8.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.8.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.8.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.8.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.80.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.80.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.80.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.80.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.80.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.80.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.81.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.81.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.81.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.81.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.81.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.81.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.82.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.82.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.82.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.82.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.82.up_proj.weight": "model-00088-of-00092.safetensors", + 
"model.layers.87.mlp.experts.82.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.83.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.83.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.83.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.83.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.83.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.83.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.84.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.84.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.84.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.84.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.84.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.84.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.85.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.85.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.85.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.85.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.85.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.85.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.86.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.86.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.86.gate_proj.weight": 
"model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.86.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.86.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.86.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.87.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.87.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.87.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.87.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.87.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.87.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.88.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.88.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.88.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.88.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.88.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.88.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.89.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.89.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.89.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.89.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.89.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.89.up_proj.weight_scale": "model-00088-of-00092.safetensors", + 
"model.layers.87.mlp.experts.9.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.9.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.9.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.9.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.9.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.9.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.90.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.90.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.90.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.90.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.90.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.90.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.91.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.91.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.91.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.91.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.91.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.91.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.92.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.92.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.92.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.92.gate_proj.weight_scale": 
"model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.92.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.92.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.93.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.93.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.93.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.93.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.93.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.93.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.94.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.94.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.94.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.94.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.94.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.94.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.95.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.95.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.95.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.95.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.95.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.95.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.96.down_proj.weight": "model-00088-of-00092.safetensors", + 
"model.layers.87.mlp.experts.96.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.96.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.96.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.96.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.96.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.97.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.97.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.97.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.97.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.97.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.97.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.98.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.98.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.98.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.98.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.98.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.98.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.99.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.99.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.99.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.99.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.99.up_proj.weight": 
"model-00088-of-00092.safetensors", + "model.layers.87.mlp.experts.99.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.gate.e_score_correction_bias": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.gate.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.shared_experts.down_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.shared_experts.down_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.shared_experts.gate_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.shared_experts.gate_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.shared_experts.up_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.mlp.shared_experts.up_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.post_attention_layernorm.weight": "model-00088-of-00092.safetensors", + "model.layers.87.self_attn.k_norm.weight": "model-00088-of-00092.safetensors", + "model.layers.87.self_attn.k_proj.bias": "model-00088-of-00092.safetensors", + "model.layers.87.self_attn.k_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.self_attn.k_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.self_attn.o_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.self_attn.o_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.self_attn.q_norm.weight": "model-00088-of-00092.safetensors", + "model.layers.87.self_attn.q_proj.bias": "model-00088-of-00092.safetensors", + "model.layers.87.self_attn.q_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.self_attn.q_proj.weight_scale": "model-00088-of-00092.safetensors", + "model.layers.87.self_attn.v_proj.bias": "model-00088-of-00092.safetensors", + "model.layers.87.self_attn.v_proj.weight": "model-00088-of-00092.safetensors", + "model.layers.87.self_attn.v_proj.weight_scale": 
"model-00088-of-00092.safetensors", + "model.layers.88.input_layernorm.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.0.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.0.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.0.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.0.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.0.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.0.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.1.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.1.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.1.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.1.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.1.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.1.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.10.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.10.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.10.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.10.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.10.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.10.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.100.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.100.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.100.gate_proj.weight": 
"model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.100.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.100.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.100.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.101.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.101.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.101.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.101.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.101.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.101.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.102.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.102.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.102.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.102.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.102.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.102.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.103.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.103.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.103.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.103.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.103.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.103.up_proj.weight_scale": "model-00089-of-00092.safetensors", + 
"model.layers.88.mlp.experts.104.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.104.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.104.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.104.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.104.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.104.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.105.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.105.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.105.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.105.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.105.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.105.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.106.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.106.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.106.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.106.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.106.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.106.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.107.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.107.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.107.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.107.gate_proj.weight_scale": 
"model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.107.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.107.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.108.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.108.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.108.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.108.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.108.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.108.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.109.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.109.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.109.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.109.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.109.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.109.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.11.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.11.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.11.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.11.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.11.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.11.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.110.down_proj.weight": "model-00089-of-00092.safetensors", + 
"model.layers.88.mlp.experts.110.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.110.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.110.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.110.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.110.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.111.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.111.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.111.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.111.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.111.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.111.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.112.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.112.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.112.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.112.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.112.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.112.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.113.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.113.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.113.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.113.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.113.up_proj.weight": 
"model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.113.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.114.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.114.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.114.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.114.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.114.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.114.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.115.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.115.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.115.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.115.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.115.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.115.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.116.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.116.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.116.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.116.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.116.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.116.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.117.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.117.down_proj.weight_scale": "model-00089-of-00092.safetensors", + 
"model.layers.88.mlp.experts.117.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.117.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.117.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.117.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.118.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.118.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.118.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.118.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.118.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.118.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.119.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.119.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.119.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.119.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.119.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.119.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.12.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.12.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.12.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.12.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.12.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.12.up_proj.weight_scale": 
"model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.120.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.120.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.120.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.120.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.120.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.120.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.121.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.121.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.121.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.121.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.121.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.121.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.122.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.122.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.122.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.122.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.122.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.122.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.123.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.123.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.123.gate_proj.weight": "model-00089-of-00092.safetensors", + 
"model.layers.88.mlp.experts.123.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.123.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.123.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.124.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.124.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.124.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.124.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.124.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.124.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.125.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.125.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.125.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.125.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.125.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.125.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.126.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.126.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.126.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.126.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.126.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.126.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.127.down_proj.weight": 
"model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.127.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.127.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.127.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.127.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.127.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.128.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.128.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.128.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.128.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.128.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.128.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.129.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.129.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.129.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.129.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.129.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.129.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.13.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.13.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.13.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.13.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + 
"model.layers.88.mlp.experts.13.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.13.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.130.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.130.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.130.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.130.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.130.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.130.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.131.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.131.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.131.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.131.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.131.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.131.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.132.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.132.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.132.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.132.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.132.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.132.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.133.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.133.down_proj.weight_scale": 
"model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.133.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.133.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.133.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.133.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.134.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.134.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.134.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.134.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.134.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.134.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.135.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.135.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.135.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.135.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.135.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.135.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.136.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.136.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.136.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.136.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.136.up_proj.weight": "model-00089-of-00092.safetensors", + 
"model.layers.88.mlp.experts.136.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.137.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.137.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.137.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.137.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.137.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.137.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.138.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.138.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.138.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.138.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.138.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.138.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.139.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.139.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.139.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.139.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.139.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.139.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.14.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.14.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.14.gate_proj.weight": 
"model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.14.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.14.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.14.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.140.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.140.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.140.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.140.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.140.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.140.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.141.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.141.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.141.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.141.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.141.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.141.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.142.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.142.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.142.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.142.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.142.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.142.up_proj.weight_scale": "model-00089-of-00092.safetensors", + 
"model.layers.88.mlp.experts.143.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.143.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.143.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.143.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.143.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.143.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.144.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.144.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.144.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.144.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.144.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.144.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.145.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.145.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.145.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.145.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.145.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.145.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.146.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.146.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.146.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.146.gate_proj.weight_scale": 
"model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.146.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.146.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.147.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.147.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.147.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.147.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.147.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.147.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.148.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.148.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.148.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.148.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.148.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.148.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.149.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.149.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.149.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.149.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.149.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.149.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.15.down_proj.weight": "model-00089-of-00092.safetensors", + 
"model.layers.88.mlp.experts.15.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.15.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.15.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.15.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.15.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.150.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.150.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.150.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.150.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.150.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.150.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.151.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.151.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.151.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.151.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.151.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.151.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.152.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.152.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.152.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.152.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.152.up_proj.weight": 
"model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.152.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.153.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.153.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.153.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.153.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.153.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.153.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.154.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.154.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.154.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.154.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.154.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.154.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.155.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.155.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.155.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.155.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.155.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.155.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.156.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.156.down_proj.weight_scale": "model-00089-of-00092.safetensors", + 
"model.layers.88.mlp.experts.156.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.156.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.156.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.156.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.157.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.157.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.157.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.157.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.157.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.157.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.158.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.158.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.158.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.158.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.158.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.158.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.159.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.159.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.159.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.159.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.159.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.159.up_proj.weight_scale": 
"model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.16.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.16.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.16.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.16.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.16.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.16.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.17.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.17.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.17.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.17.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.17.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.17.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.18.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.18.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.18.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.18.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.18.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.18.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.19.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.19.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.19.gate_proj.weight": "model-00089-of-00092.safetensors", + 
"model.layers.88.mlp.experts.19.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.19.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.19.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.2.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.2.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.2.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.2.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.2.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.2.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.20.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.20.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.20.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.20.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.20.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.20.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.21.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.21.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.21.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.21.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.21.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.21.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.22.down_proj.weight": "model-00089-of-00092.safetensors", 
+ "model.layers.88.mlp.experts.22.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.22.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.22.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.22.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.22.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.23.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.23.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.23.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.23.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.23.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.23.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.24.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.24.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.24.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.24.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.24.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.24.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.25.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.25.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.25.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.25.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.25.up_proj.weight": 
"model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.25.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.26.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.26.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.26.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.26.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.26.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.26.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.27.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.27.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.27.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.27.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.27.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.27.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.28.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.28.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.28.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.28.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.28.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.28.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.29.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.29.down_proj.weight_scale": "model-00089-of-00092.safetensors", + 
"model.layers.88.mlp.experts.29.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.29.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.29.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.29.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.3.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.3.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.3.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.3.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.3.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.3.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.30.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.30.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.30.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.30.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.30.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.30.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.31.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.31.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.31.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.31.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.31.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.31.up_proj.weight_scale": "model-00089-of-00092.safetensors", 
+ "model.layers.88.mlp.experts.32.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.32.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.32.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.32.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.32.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.32.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.33.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.33.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.33.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.33.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.33.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.33.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.34.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.34.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.34.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.34.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.34.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.34.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.35.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.35.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.35.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.35.gate_proj.weight_scale": 
"model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.35.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.35.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.36.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.36.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.36.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.36.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.36.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.36.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.37.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.37.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.37.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.37.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.37.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.37.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.38.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.38.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.38.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.38.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.38.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.38.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.39.down_proj.weight": "model-00089-of-00092.safetensors", + 
"model.layers.88.mlp.experts.39.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.39.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.39.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.39.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.39.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.4.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.4.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.4.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.4.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.4.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.4.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.40.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.40.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.40.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.40.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.40.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.40.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.41.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.41.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.41.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.41.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.41.up_proj.weight": 
"model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.41.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.42.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.42.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.42.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.42.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.42.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.42.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.43.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.43.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.43.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.43.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.43.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.43.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.44.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.44.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.44.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.44.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.44.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.44.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.45.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.45.down_proj.weight_scale": "model-00089-of-00092.safetensors", + 
"model.layers.88.mlp.experts.45.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.45.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.45.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.45.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.46.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.46.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.46.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.46.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.46.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.46.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.47.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.47.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.47.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.47.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.47.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.47.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.48.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.48.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.48.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.48.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.48.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.48.up_proj.weight_scale": 
"model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.49.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.49.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.49.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.49.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.49.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.49.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.5.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.5.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.5.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.5.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.5.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.5.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.50.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.50.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.50.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.50.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.50.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.50.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.51.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.51.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.51.gate_proj.weight": "model-00089-of-00092.safetensors", + 
"model.layers.88.mlp.experts.51.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.51.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.51.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.52.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.52.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.52.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.52.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.52.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.52.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.53.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.53.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.53.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.53.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.53.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.53.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.54.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.54.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.54.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.54.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.54.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.54.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.55.down_proj.weight": 
"model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.55.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.55.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.55.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.55.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.55.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.56.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.56.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.56.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.56.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.56.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.56.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.57.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.57.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.57.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.57.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.57.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.57.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.58.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.58.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.58.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.58.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + 
"model.layers.88.mlp.experts.58.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.58.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.59.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.59.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.59.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.59.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.59.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.59.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.6.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.6.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.6.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.6.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.6.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.6.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.60.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.60.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.60.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.60.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.60.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.60.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.61.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.61.down_proj.weight_scale": "model-00089-of-00092.safetensors", 
+ "model.layers.88.mlp.experts.61.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.61.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.61.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.61.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.62.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.62.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.62.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.62.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.62.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.62.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.63.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.63.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.63.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.63.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.63.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.63.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.64.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.64.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.64.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.64.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.64.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.64.up_proj.weight_scale": 
"model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.65.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.65.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.65.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.65.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.65.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.65.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.66.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.66.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.66.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.66.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.66.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.66.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.67.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.67.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.67.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.67.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.67.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.67.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.68.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.68.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.68.gate_proj.weight": "model-00089-of-00092.safetensors", + 
"model.layers.88.mlp.experts.68.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.68.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.68.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.69.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.69.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.69.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.69.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.69.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.69.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.7.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.7.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.7.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.7.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.7.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.7.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.70.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.70.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.70.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.70.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.70.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.70.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.71.down_proj.weight": "model-00089-of-00092.safetensors", 
+ "model.layers.88.mlp.experts.71.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.71.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.71.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.71.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.71.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.72.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.72.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.72.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.72.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.72.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.72.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.73.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.73.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.73.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.73.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.73.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.73.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.74.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.74.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.74.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.74.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.74.up_proj.weight": 
"model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.74.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.75.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.75.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.75.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.75.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.75.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.75.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.76.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.76.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.76.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.76.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.76.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.76.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.77.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.77.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.77.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.77.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.77.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.77.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.78.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.78.down_proj.weight_scale": "model-00089-of-00092.safetensors", + 
"model.layers.88.mlp.experts.78.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.78.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.78.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.78.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.79.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.79.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.79.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.79.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.79.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.79.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.8.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.8.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.8.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.8.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.8.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.8.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.80.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.80.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.80.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.80.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.80.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.80.up_proj.weight_scale": "model-00089-of-00092.safetensors", 
+ "model.layers.88.mlp.experts.81.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.81.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.81.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.81.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.81.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.81.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.82.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.82.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.82.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.82.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.82.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.82.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.83.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.83.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.83.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.83.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.83.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.83.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.84.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.84.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.84.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.84.gate_proj.weight_scale": 
"model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.84.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.84.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.85.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.85.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.85.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.85.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.85.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.85.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.86.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.86.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.86.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.86.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.86.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.86.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.87.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.87.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.87.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.87.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.87.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.87.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.88.down_proj.weight": "model-00089-of-00092.safetensors", + 
"model.layers.88.mlp.experts.88.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.88.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.88.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.88.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.88.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.89.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.89.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.89.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.89.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.89.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.89.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.9.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.9.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.9.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.9.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.9.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.9.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.90.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.90.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.90.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.90.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.90.up_proj.weight": 
"model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.90.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.91.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.91.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.91.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.91.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.91.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.91.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.92.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.92.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.92.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.92.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.92.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.92.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.93.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.93.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.93.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.93.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.93.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.93.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.94.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.94.down_proj.weight_scale": "model-00089-of-00092.safetensors", + 
"model.layers.88.mlp.experts.94.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.94.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.94.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.94.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.95.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.95.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.95.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.95.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.95.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.95.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.96.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.96.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.96.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.96.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.96.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.96.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.97.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.97.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.97.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.97.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.97.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.97.up_proj.weight_scale": 
"model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.98.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.98.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.98.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.98.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.98.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.98.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.99.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.99.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.99.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.99.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.99.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.experts.99.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.gate.e_score_correction_bias": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.gate.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.shared_experts.down_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.shared_experts.down_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.shared_experts.gate_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.shared_experts.gate_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.shared_experts.up_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.mlp.shared_experts.up_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.post_attention_layernorm.weight": "model-00089-of-00092.safetensors", + 
"model.layers.88.self_attn.k_norm.weight": "model-00089-of-00092.safetensors", + "model.layers.88.self_attn.k_proj.bias": "model-00089-of-00092.safetensors", + "model.layers.88.self_attn.k_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.self_attn.k_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.self_attn.o_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.self_attn.o_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.self_attn.q_norm.weight": "model-00089-of-00092.safetensors", + "model.layers.88.self_attn.q_proj.bias": "model-00089-of-00092.safetensors", + "model.layers.88.self_attn.q_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.self_attn.q_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.88.self_attn.v_proj.bias": "model-00089-of-00092.safetensors", + "model.layers.88.self_attn.v_proj.weight": "model-00089-of-00092.safetensors", + "model.layers.88.self_attn.v_proj.weight_scale": "model-00089-of-00092.safetensors", + "model.layers.89.input_layernorm.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.0.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.0.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.0.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.0.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.0.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.0.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.1.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.1.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.1.gate_proj.weight": "model-00090-of-00092.safetensors", + 
"model.layers.89.mlp.experts.1.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.1.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.1.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.10.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.10.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.10.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.10.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.10.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.10.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.100.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.100.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.100.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.100.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.100.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.100.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.101.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.101.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.101.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.101.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.101.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.101.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.102.down_proj.weight": 
"model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.102.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.102.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.102.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.102.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.102.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.103.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.103.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.103.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.103.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.103.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.103.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.104.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.104.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.104.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.104.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.104.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.104.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.105.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.105.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.105.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.105.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + 
"model.layers.89.mlp.experts.105.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.105.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.106.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.106.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.106.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.106.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.106.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.106.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.107.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.107.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.107.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.107.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.107.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.107.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.108.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.108.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.108.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.108.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.108.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.108.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.109.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.109.down_proj.weight_scale": 
"model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.109.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.109.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.109.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.109.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.11.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.11.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.11.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.11.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.11.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.11.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.110.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.110.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.110.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.110.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.110.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.110.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.111.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.111.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.111.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.111.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.111.up_proj.weight": "model-00090-of-00092.safetensors", + 
"model.layers.89.mlp.experts.111.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.112.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.112.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.112.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.112.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.112.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.112.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.113.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.113.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.113.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.113.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.113.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.113.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.114.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.114.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.114.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.114.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.114.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.114.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.115.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.115.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.115.gate_proj.weight": 
"model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.115.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.115.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.115.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.116.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.116.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.116.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.116.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.116.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.116.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.117.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.117.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.117.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.117.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.117.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.117.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.118.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.118.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.118.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.118.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.118.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.118.up_proj.weight_scale": "model-00090-of-00092.safetensors", + 
"model.layers.89.mlp.experts.119.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.119.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.119.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.119.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.119.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.119.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.12.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.12.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.12.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.12.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.12.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.12.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.120.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.120.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.120.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.120.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.120.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.120.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.121.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.121.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.121.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.121.gate_proj.weight_scale": 
"model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.121.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.121.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.122.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.122.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.122.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.122.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.122.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.122.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.123.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.123.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.123.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.123.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.123.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.123.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.124.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.124.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.124.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.124.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.124.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.124.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.125.down_proj.weight": "model-00090-of-00092.safetensors", + 
"model.layers.89.mlp.experts.125.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.125.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.125.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.125.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.125.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.126.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.126.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.126.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.126.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.126.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.126.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.127.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.127.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.127.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.127.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.127.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.127.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.128.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.128.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.128.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.128.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.128.up_proj.weight": 
"model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.128.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.129.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.129.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.129.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.129.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.129.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.129.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.13.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.13.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.13.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.13.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.13.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.13.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.130.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.130.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.130.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.130.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.130.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.130.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.131.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.131.down_proj.weight_scale": "model-00090-of-00092.safetensors", + 
"model.layers.89.mlp.experts.131.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.131.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.131.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.131.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.132.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.132.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.132.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.132.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.132.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.132.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.133.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.133.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.133.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.133.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.133.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.133.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.134.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.134.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.134.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.134.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.134.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.134.up_proj.weight_scale": 
"model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.135.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.135.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.135.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.135.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.135.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.135.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.136.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.136.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.136.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.136.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.136.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.136.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.137.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.137.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.137.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.137.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.137.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.137.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.138.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.138.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.138.gate_proj.weight": "model-00090-of-00092.safetensors", + 
"model.layers.89.mlp.experts.138.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.138.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.138.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.139.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.139.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.139.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.139.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.139.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.139.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.14.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.14.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.14.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.14.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.14.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.14.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.140.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.140.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.140.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.140.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.140.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.140.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.141.down_proj.weight": 
"model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.141.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.141.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.141.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.141.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.141.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.142.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.142.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.142.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.142.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.142.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.142.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.143.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.143.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.143.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.143.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.143.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.143.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.144.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.144.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.144.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.144.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + 
"model.layers.89.mlp.experts.144.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.144.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.145.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.145.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.145.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.145.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.145.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.145.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.146.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.146.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.146.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.146.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.146.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.146.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.147.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.147.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.147.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.147.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.147.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.147.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.148.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.148.down_proj.weight_scale": 
"model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.148.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.148.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.148.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.148.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.149.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.149.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.149.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.149.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.149.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.149.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.15.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.15.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.15.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.15.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.15.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.15.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.150.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.150.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.150.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.150.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.150.up_proj.weight": "model-00090-of-00092.safetensors", + 
"model.layers.89.mlp.experts.150.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.151.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.151.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.151.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.151.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.151.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.151.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.152.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.152.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.152.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.152.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.152.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.152.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.153.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.153.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.153.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.153.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.153.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.153.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.154.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.154.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.154.gate_proj.weight": 
"model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.154.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.154.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.154.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.155.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.155.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.155.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.155.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.155.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.155.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.156.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.156.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.156.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.156.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.156.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.156.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.157.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.157.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.157.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.157.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.157.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.157.up_proj.weight_scale": "model-00090-of-00092.safetensors", + 
"model.layers.89.mlp.experts.158.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.158.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.158.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.158.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.158.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.158.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.159.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.159.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.159.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.159.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.159.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.159.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.16.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.16.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.16.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.16.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.16.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.16.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.17.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.17.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.17.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.17.gate_proj.weight_scale": 
"model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.17.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.17.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.18.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.18.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.18.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.18.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.18.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.18.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.19.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.19.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.19.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.19.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.19.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.19.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.2.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.2.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.2.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.2.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.2.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.2.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.20.down_proj.weight": "model-00090-of-00092.safetensors", + 
"model.layers.89.mlp.experts.20.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.20.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.20.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.20.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.20.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.21.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.21.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.21.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.21.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.21.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.21.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.22.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.22.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.22.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.22.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.22.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.22.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.23.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.23.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.23.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.23.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.23.up_proj.weight": 
"model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.23.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.24.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.24.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.24.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.24.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.24.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.24.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.25.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.25.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.25.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.25.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.25.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.25.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.26.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.26.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.26.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.26.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.26.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.26.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.27.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.27.down_proj.weight_scale": "model-00090-of-00092.safetensors", + 
"model.layers.89.mlp.experts.27.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.27.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.27.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.27.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.28.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.28.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.28.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.28.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.28.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.28.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.29.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.29.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.29.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.29.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.29.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.29.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.3.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.3.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.3.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.3.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.3.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.3.up_proj.weight_scale": "model-00090-of-00092.safetensors", 
+ "model.layers.89.mlp.experts.30.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.30.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.30.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.30.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.30.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.30.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.31.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.31.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.31.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.31.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.31.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.31.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.32.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.32.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.32.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.32.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.32.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.32.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.33.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.33.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.33.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.33.gate_proj.weight_scale": 
"model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.33.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.33.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.34.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.34.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.34.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.34.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.34.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.34.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.35.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.35.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.35.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.35.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.35.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.35.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.36.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.36.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.36.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.36.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.36.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.36.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.37.down_proj.weight": "model-00090-of-00092.safetensors", + 
"model.layers.89.mlp.experts.37.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.37.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.37.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.37.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.37.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.38.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.38.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.38.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.38.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.38.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.38.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.39.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.39.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.39.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.39.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.39.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.39.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.4.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.4.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.4.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.4.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.4.up_proj.weight": 
"model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.4.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.40.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.40.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.40.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.40.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.40.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.40.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.41.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.41.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.41.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.41.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.41.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.41.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.42.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.42.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.42.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.42.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.42.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.42.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.43.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.43.down_proj.weight_scale": "model-00090-of-00092.safetensors", + 
"model.layers.89.mlp.experts.43.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.43.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.43.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.43.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.44.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.44.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.44.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.44.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.44.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.44.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.45.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.45.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.45.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.45.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.45.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.45.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.46.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.46.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.46.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.46.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.46.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.46.up_proj.weight_scale": 
"model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.47.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.47.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.47.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.47.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.47.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.47.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.48.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.48.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.48.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.48.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.48.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.48.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.49.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.49.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.49.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.49.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.49.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.49.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.5.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.5.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.5.gate_proj.weight": "model-00090-of-00092.safetensors", + 
"model.layers.89.mlp.experts.5.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.5.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.5.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.50.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.50.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.50.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.50.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.50.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.50.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.51.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.51.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.51.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.51.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.51.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.51.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.52.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.52.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.52.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.52.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.52.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.52.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.53.down_proj.weight": 
"model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.53.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.53.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.53.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.53.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.53.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.54.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.54.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.54.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.54.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.54.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.54.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.55.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.55.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.55.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.55.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.55.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.55.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.56.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.56.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.56.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.56.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + 
"model.layers.89.mlp.experts.56.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.56.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.57.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.57.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.57.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.57.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.57.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.57.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.58.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.58.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.58.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.58.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.58.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.58.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.59.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.59.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.59.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.59.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.59.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.59.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.6.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.6.down_proj.weight_scale": 
"model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.6.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.6.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.6.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.6.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.60.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.60.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.60.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.60.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.60.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.60.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.61.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.61.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.61.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.61.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.61.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.61.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.62.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.62.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.62.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.62.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.62.up_proj.weight": "model-00090-of-00092.safetensors", + 
"model.layers.89.mlp.experts.62.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.63.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.63.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.63.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.63.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.63.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.63.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.64.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.64.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.64.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.64.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.64.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.64.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.65.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.65.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.65.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.65.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.65.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.65.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.66.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.66.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.66.gate_proj.weight": 
"model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.66.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.66.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.66.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.67.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.67.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.67.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.67.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.67.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.67.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.68.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.68.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.68.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.68.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.68.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.68.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.69.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.69.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.69.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.69.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.69.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.69.up_proj.weight_scale": "model-00090-of-00092.safetensors", + 
"model.layers.89.mlp.experts.7.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.7.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.7.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.7.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.7.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.7.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.70.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.70.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.70.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.70.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.70.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.70.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.71.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.71.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.71.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.71.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.71.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.71.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.72.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.72.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.72.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.72.gate_proj.weight_scale": 
"model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.72.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.72.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.73.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.73.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.73.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.73.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.73.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.73.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.74.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.74.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.74.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.74.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.74.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.74.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.75.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.75.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.75.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.75.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.75.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.75.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.76.down_proj.weight": "model-00090-of-00092.safetensors", + 
"model.layers.89.mlp.experts.76.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.76.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.76.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.76.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.76.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.77.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.77.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.77.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.77.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.77.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.77.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.78.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.78.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.78.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.78.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.78.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.78.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.79.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.79.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.79.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.79.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.79.up_proj.weight": 
"model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.79.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.8.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.8.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.8.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.8.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.8.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.8.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.80.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.80.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.80.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.80.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.80.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.80.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.81.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.81.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.81.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.81.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.81.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.81.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.82.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.82.down_proj.weight_scale": "model-00090-of-00092.safetensors", + 
"model.layers.89.mlp.experts.82.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.82.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.82.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.82.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.83.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.83.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.83.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.83.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.83.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.83.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.84.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.84.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.84.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.84.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.84.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.84.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.85.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.85.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.85.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.85.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.85.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.85.up_proj.weight_scale": 
"model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.86.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.86.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.86.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.86.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.86.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.86.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.87.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.87.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.87.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.87.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.87.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.87.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.88.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.88.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.88.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.88.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.88.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.88.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.89.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.89.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.89.gate_proj.weight": "model-00090-of-00092.safetensors", + 
"model.layers.89.mlp.experts.89.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.89.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.89.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.9.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.9.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.9.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.9.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.9.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.9.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.90.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.90.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.90.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.90.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.90.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.90.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.91.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.91.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.91.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.91.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.91.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.91.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.92.down_proj.weight": "model-00090-of-00092.safetensors", 
+ "model.layers.89.mlp.experts.92.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.92.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.92.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.92.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.92.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.93.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.93.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.93.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.93.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.93.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.93.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.94.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.94.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.94.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.94.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.94.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.94.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.95.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.95.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.95.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.95.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.95.up_proj.weight": 
"model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.95.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.96.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.96.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.96.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.96.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.96.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.96.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.97.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.97.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.97.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.97.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.97.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.97.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.98.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.98.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.98.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.98.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.98.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.98.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.99.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.99.down_proj.weight_scale": "model-00090-of-00092.safetensors", + 
"model.layers.89.mlp.experts.99.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.99.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.99.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.experts.99.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.gate.e_score_correction_bias": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.gate.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.shared_experts.down_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.shared_experts.down_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.shared_experts.gate_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.shared_experts.gate_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.shared_experts.up_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.mlp.shared_experts.up_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.post_attention_layernorm.weight": "model-00090-of-00092.safetensors", + "model.layers.89.self_attn.k_norm.weight": "model-00090-of-00092.safetensors", + "model.layers.89.self_attn.k_proj.bias": "model-00090-of-00092.safetensors", + "model.layers.89.self_attn.k_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.self_attn.k_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.self_attn.o_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.self_attn.o_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.89.self_attn.q_norm.weight": "model-00090-of-00092.safetensors", + "model.layers.89.self_attn.q_proj.bias": "model-00090-of-00092.safetensors", + "model.layers.89.self_attn.q_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.self_attn.q_proj.weight_scale": 
"model-00090-of-00092.safetensors", + "model.layers.89.self_attn.v_proj.bias": "model-00090-of-00092.safetensors", + "model.layers.89.self_attn.v_proj.weight": "model-00090-of-00092.safetensors", + "model.layers.89.self_attn.v_proj.weight_scale": "model-00090-of-00092.safetensors", + "model.layers.90.input_layernorm.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.0.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.0.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.0.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.0.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.0.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.0.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.1.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.1.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.1.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.1.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.1.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.1.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.10.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.10.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.10.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.10.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.10.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.10.up_proj.weight_scale": "model-00091-of-00092.safetensors", + 
"model.layers.90.mlp.experts.100.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.100.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.100.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.100.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.100.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.100.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.101.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.101.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.101.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.101.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.101.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.101.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.102.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.102.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.102.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.102.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.102.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.102.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.103.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.103.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.103.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.103.gate_proj.weight_scale": 
"model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.103.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.103.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.104.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.104.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.104.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.104.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.104.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.104.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.105.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.105.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.105.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.105.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.105.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.105.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.106.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.106.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.106.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.106.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.106.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.106.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.107.down_proj.weight": "model-00091-of-00092.safetensors", + 
"model.layers.90.mlp.experts.107.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.107.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.107.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.107.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.107.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.108.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.108.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.108.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.108.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.108.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.108.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.109.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.109.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.109.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.109.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.109.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.109.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.11.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.11.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.11.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.11.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.11.up_proj.weight": 
"model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.11.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.110.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.110.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.110.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.110.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.110.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.110.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.111.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.111.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.111.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.111.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.111.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.111.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.112.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.112.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.112.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.112.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.112.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.112.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.113.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.113.down_proj.weight_scale": "model-00091-of-00092.safetensors", + 
"model.layers.90.mlp.experts.113.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.113.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.113.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.113.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.114.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.114.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.114.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.114.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.114.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.114.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.115.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.115.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.115.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.115.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.115.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.115.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.116.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.116.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.116.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.116.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.116.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.116.up_proj.weight_scale": 
"model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.117.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.117.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.117.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.117.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.117.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.117.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.118.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.118.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.118.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.118.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.118.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.118.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.119.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.119.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.119.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.119.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.119.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.119.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.12.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.12.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.12.gate_proj.weight": "model-00091-of-00092.safetensors", + 
"model.layers.90.mlp.experts.12.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.12.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.12.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.120.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.120.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.120.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.120.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.120.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.120.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.121.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.121.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.121.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.121.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.121.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.121.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.122.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.122.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.122.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.122.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.122.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.122.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.123.down_proj.weight": 
"model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.123.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.123.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.123.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.123.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.123.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.124.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.124.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.124.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.124.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.124.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.124.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.125.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.125.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.125.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.125.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.125.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.125.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.126.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.126.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.126.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.126.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + 
"model.layers.90.mlp.experts.126.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.126.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.127.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.127.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.127.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.127.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.127.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.127.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.128.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.128.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.128.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.128.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.128.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.128.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.129.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.129.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.129.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.129.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.129.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.129.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.13.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.13.down_proj.weight_scale": 
"model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.13.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.13.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.13.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.13.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.130.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.130.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.130.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.130.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.130.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.130.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.131.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.131.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.131.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.131.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.131.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.131.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.132.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.132.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.132.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.132.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.132.up_proj.weight": "model-00091-of-00092.safetensors", + 
"model.layers.90.mlp.experts.132.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.133.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.133.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.133.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.133.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.133.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.133.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.134.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.134.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.134.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.134.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.134.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.134.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.135.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.135.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.135.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.135.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.135.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.135.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.136.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.136.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.136.gate_proj.weight": 
"model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.136.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.136.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.136.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.137.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.137.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.137.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.137.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.137.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.137.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.138.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.138.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.138.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.138.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.138.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.138.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.139.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.139.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.139.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.139.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.139.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.139.up_proj.weight_scale": "model-00091-of-00092.safetensors", + 
"model.layers.90.mlp.experts.14.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.14.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.14.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.14.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.14.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.14.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.140.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.140.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.140.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.140.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.140.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.140.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.141.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.141.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.141.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.141.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.141.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.141.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.142.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.142.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.142.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.142.gate_proj.weight_scale": 
"model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.142.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.142.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.143.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.143.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.143.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.143.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.143.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.143.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.144.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.144.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.144.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.144.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.144.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.144.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.145.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.145.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.145.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.145.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.145.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.145.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.146.down_proj.weight": "model-00091-of-00092.safetensors", + 
"model.layers.90.mlp.experts.146.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.146.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.146.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.146.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.146.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.147.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.147.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.147.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.147.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.147.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.147.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.148.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.148.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.148.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.148.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.148.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.148.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.149.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.149.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.149.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.149.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.149.up_proj.weight": 
"model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.149.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.15.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.15.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.15.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.15.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.15.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.15.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.150.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.150.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.150.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.150.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.150.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.150.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.151.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.151.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.151.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.151.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.151.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.151.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.152.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.152.down_proj.weight_scale": "model-00091-of-00092.safetensors", + 
"model.layers.90.mlp.experts.152.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.152.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.152.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.152.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.153.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.153.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.153.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.153.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.153.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.153.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.154.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.154.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.154.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.154.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.154.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.154.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.155.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.155.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.155.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.155.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.155.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.155.up_proj.weight_scale": 
"model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.156.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.156.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.156.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.156.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.156.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.156.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.157.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.157.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.157.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.157.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.157.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.157.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.158.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.158.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.158.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.158.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.158.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.158.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.159.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.159.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.159.gate_proj.weight": "model-00091-of-00092.safetensors", + 
"model.layers.90.mlp.experts.159.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.159.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.159.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.16.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.16.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.16.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.16.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.16.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.16.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.17.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.17.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.17.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.17.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.17.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.17.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.18.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.18.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.18.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.18.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.18.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.18.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.19.down_proj.weight": 
"model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.19.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.19.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.19.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.19.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.19.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.2.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.2.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.2.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.2.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.2.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.2.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.20.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.20.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.20.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.20.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.20.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.20.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.21.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.21.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.21.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.21.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + 
"model.layers.90.mlp.experts.21.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.21.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.22.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.22.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.22.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.22.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.22.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.22.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.23.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.23.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.23.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.23.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.23.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.23.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.24.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.24.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.24.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.24.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.24.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.24.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.25.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.25.down_proj.weight_scale": 
"model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.25.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.25.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.25.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.25.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.26.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.26.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.26.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.26.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.26.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.26.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.27.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.27.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.27.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.27.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.27.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.27.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.28.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.28.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.28.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.28.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.28.up_proj.weight": "model-00091-of-00092.safetensors", + 
"model.layers.90.mlp.experts.28.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.29.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.29.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.29.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.29.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.29.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.29.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.3.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.3.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.3.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.3.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.3.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.3.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.30.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.30.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.30.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.30.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.30.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.30.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.31.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.31.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.31.gate_proj.weight": 
"model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.31.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.31.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.31.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.32.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.32.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.32.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.32.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.32.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.32.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.33.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.33.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.33.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.33.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.33.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.33.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.34.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.34.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.34.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.34.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.34.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.34.up_proj.weight_scale": "model-00091-of-00092.safetensors", + 
"model.layers.90.mlp.experts.35.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.35.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.35.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.35.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.35.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.35.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.36.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.36.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.36.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.36.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.36.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.36.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.37.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.37.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.37.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.37.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.37.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.37.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.38.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.38.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.38.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.38.gate_proj.weight_scale": 
"model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.38.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.38.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.39.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.39.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.39.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.39.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.39.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.39.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.4.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.4.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.4.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.4.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.4.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.4.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.40.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.40.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.40.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.40.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.40.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.40.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.41.down_proj.weight": "model-00091-of-00092.safetensors", + 
"model.layers.90.mlp.experts.41.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.41.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.41.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.41.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.41.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.42.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.42.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.42.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.42.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.42.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.42.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.43.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.43.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.43.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.43.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.43.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.43.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.44.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.44.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.44.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.44.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.44.up_proj.weight": 
"model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.44.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.45.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.45.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.45.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.45.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.45.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.45.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.46.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.46.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.46.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.46.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.46.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.46.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.47.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.47.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.47.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.47.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.47.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.47.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.48.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.48.down_proj.weight_scale": "model-00091-of-00092.safetensors", + 
"model.layers.90.mlp.experts.48.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.48.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.48.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.48.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.49.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.49.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.49.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.49.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.49.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.49.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.5.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.5.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.5.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.5.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.5.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.5.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.50.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.50.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.50.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.50.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.50.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.50.up_proj.weight_scale": "model-00091-of-00092.safetensors", 
+ "model.layers.90.mlp.experts.51.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.51.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.51.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.51.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.51.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.51.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.52.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.52.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.52.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.52.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.52.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.52.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.53.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.53.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.53.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.53.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.53.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.53.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.54.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.54.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.54.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.54.gate_proj.weight_scale": 
"model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.54.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.54.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.55.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.55.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.55.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.55.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.55.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.55.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.56.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.56.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.56.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.56.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.56.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.56.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.57.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.57.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.57.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.57.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.57.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.57.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.58.down_proj.weight": "model-00091-of-00092.safetensors", + 
"model.layers.90.mlp.experts.58.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.58.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.58.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.58.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.58.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.59.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.59.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.59.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.59.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.59.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.59.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.6.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.6.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.6.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.6.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.6.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.6.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.60.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.60.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.60.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.60.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.60.up_proj.weight": 
"model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.60.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.61.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.61.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.61.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.61.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.61.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.61.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.62.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.62.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.62.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.62.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.62.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.62.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.63.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.63.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.63.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.63.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.63.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.63.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.64.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.64.down_proj.weight_scale": "model-00091-of-00092.safetensors", + 
"model.layers.90.mlp.experts.64.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.64.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.64.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.64.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.65.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.65.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.65.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.65.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.65.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.65.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.66.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.66.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.66.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.66.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.66.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.66.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.67.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.67.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.67.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.67.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.67.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.67.up_proj.weight_scale": 
"model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.68.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.68.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.68.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.68.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.68.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.68.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.69.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.69.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.69.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.69.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.69.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.69.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.7.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.7.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.7.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.7.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.7.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.7.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.70.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.70.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.70.gate_proj.weight": "model-00091-of-00092.safetensors", + 
"model.layers.90.mlp.experts.70.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.70.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.70.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.71.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.71.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.71.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.71.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.71.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.71.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.72.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.72.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.72.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.72.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.72.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.72.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.73.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.73.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.73.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.73.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.73.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.73.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.74.down_proj.weight": 
"model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.74.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.74.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.74.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.74.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.74.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.75.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.75.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.75.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.75.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.75.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.75.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.76.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.76.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.76.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.76.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.76.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.76.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.77.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.77.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.77.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.77.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + 
"model.layers.90.mlp.experts.77.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.77.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.78.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.78.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.78.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.78.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.78.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.78.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.79.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.79.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.79.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.79.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.79.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.79.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.8.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.8.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.8.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.8.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.8.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.8.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.80.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.80.down_proj.weight_scale": "model-00091-of-00092.safetensors", 
+ "model.layers.90.mlp.experts.80.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.80.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.80.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.80.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.81.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.81.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.81.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.81.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.81.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.81.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.82.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.82.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.82.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.82.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.82.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.82.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.83.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.83.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.83.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.83.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.83.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.83.up_proj.weight_scale": 
"model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.84.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.84.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.84.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.84.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.84.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.84.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.85.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.85.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.85.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.85.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.85.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.85.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.86.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.86.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.86.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.86.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.86.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.86.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.87.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.87.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.87.gate_proj.weight": "model-00091-of-00092.safetensors", + 
"model.layers.90.mlp.experts.87.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.87.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.87.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.88.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.88.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.88.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.88.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.88.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.88.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.89.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.89.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.89.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.89.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.89.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.89.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.9.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.9.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.9.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.9.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.9.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.9.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.90.down_proj.weight": "model-00091-of-00092.safetensors", 
+ "model.layers.90.mlp.experts.90.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.90.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.90.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.90.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.90.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.91.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.91.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.91.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.91.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.91.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.91.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.92.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.92.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.92.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.92.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.92.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.92.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.93.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.93.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.93.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.93.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.93.up_proj.weight": 
"model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.93.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.94.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.94.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.94.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.94.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.94.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.94.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.95.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.95.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.95.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.95.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.95.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.95.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.96.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.96.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.96.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.96.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.96.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.96.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.97.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.97.down_proj.weight_scale": "model-00091-of-00092.safetensors", + 
"model.layers.90.mlp.experts.97.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.97.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.97.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.97.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.98.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.98.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.98.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.98.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.98.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.98.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.99.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.99.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.99.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.99.gate_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.99.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.experts.99.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.gate.e_score_correction_bias": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.gate.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.shared_experts.down_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.shared_experts.down_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.shared_experts.gate_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.shared_experts.gate_proj.weight_scale": 
"model-00091-of-00092.safetensors", + "model.layers.90.mlp.shared_experts.up_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.mlp.shared_experts.up_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.post_attention_layernorm.weight": "model-00091-of-00092.safetensors", + "model.layers.90.self_attn.k_norm.weight": "model-00091-of-00092.safetensors", + "model.layers.90.self_attn.k_proj.bias": "model-00091-of-00092.safetensors", + "model.layers.90.self_attn.k_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.self_attn.k_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.self_attn.o_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.self_attn.o_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.self_attn.q_norm.weight": "model-00091-of-00092.safetensors", + "model.layers.90.self_attn.q_proj.bias": "model-00091-of-00092.safetensors", + "model.layers.90.self_attn.q_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.self_attn.q_proj.weight_scale": "model-00091-of-00092.safetensors", + "model.layers.90.self_attn.v_proj.bias": "model-00091-of-00092.safetensors", + "model.layers.90.self_attn.v_proj.weight": "model-00091-of-00092.safetensors", + "model.layers.90.self_attn.v_proj.weight_scale": "model-00091-of-00092.safetensors", + "lm_head.weight": "model-00092-of-00092.safetensors", + "model.layers.91.input_layernorm.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.0.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.0.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.0.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.0.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.0.up_proj.weight": "model-00092-of-00092.safetensors", + 
"model.layers.91.mlp.experts.0.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.1.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.1.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.1.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.1.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.1.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.1.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.10.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.10.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.10.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.10.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.10.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.10.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.100.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.100.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.100.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.100.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.100.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.100.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.101.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.101.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.101.gate_proj.weight": 
"model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.101.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.101.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.101.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.102.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.102.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.102.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.102.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.102.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.102.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.103.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.103.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.103.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.103.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.103.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.103.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.104.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.104.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.104.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.104.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.104.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.104.up_proj.weight_scale": "model-00092-of-00092.safetensors", + 
"model.layers.91.mlp.experts.105.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.105.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.105.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.105.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.105.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.105.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.106.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.106.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.106.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.106.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.106.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.106.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.107.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.107.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.107.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.107.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.107.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.107.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.108.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.108.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.108.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.108.gate_proj.weight_scale": 
"model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.108.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.108.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.109.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.109.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.109.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.109.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.109.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.109.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.11.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.11.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.11.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.11.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.11.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.11.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.110.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.110.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.110.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.110.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.110.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.110.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.111.down_proj.weight": "model-00092-of-00092.safetensors", + 
"model.layers.91.mlp.experts.111.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.111.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.111.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.111.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.111.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.112.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.112.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.112.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.112.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.112.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.112.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.113.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.113.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.113.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.113.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.113.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.113.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.114.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.114.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.114.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.114.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.114.up_proj.weight": 
"model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.114.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.115.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.115.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.115.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.115.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.115.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.115.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.116.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.116.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.116.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.116.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.116.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.116.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.117.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.117.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.117.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.117.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.117.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.117.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.118.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.118.down_proj.weight_scale": "model-00092-of-00092.safetensors", + 
"model.layers.91.mlp.experts.118.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.118.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.118.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.118.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.119.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.119.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.119.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.119.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.119.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.119.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.12.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.12.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.12.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.12.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.12.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.12.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.120.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.120.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.120.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.120.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.120.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.120.up_proj.weight_scale": 
"model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.121.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.121.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.121.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.121.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.121.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.121.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.122.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.122.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.122.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.122.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.122.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.122.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.123.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.123.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.123.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.123.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.123.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.123.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.124.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.124.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.124.gate_proj.weight": "model-00092-of-00092.safetensors", + 
"model.layers.91.mlp.experts.124.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.124.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.124.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.125.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.125.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.125.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.125.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.125.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.125.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.126.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.126.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.126.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.126.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.126.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.126.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.127.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.127.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.127.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.127.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.127.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.127.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.128.down_proj.weight": 
"model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.128.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.128.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.128.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.128.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.128.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.129.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.129.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.129.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.129.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.129.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.129.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.13.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.13.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.13.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.13.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.13.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.13.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.130.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.130.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.130.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.130.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + 
"model.layers.91.mlp.experts.130.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.130.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.131.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.131.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.131.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.131.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.131.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.131.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.132.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.132.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.132.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.132.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.132.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.132.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.133.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.133.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.133.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.133.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.133.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.133.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.134.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.134.down_proj.weight_scale": 
"model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.134.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.134.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.134.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.134.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.135.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.135.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.135.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.135.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.135.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.135.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.136.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.136.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.136.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.136.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.136.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.136.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.137.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.137.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.137.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.137.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.137.up_proj.weight": "model-00092-of-00092.safetensors", + 
"model.layers.91.mlp.experts.137.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.138.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.138.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.138.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.138.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.138.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.138.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.139.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.139.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.139.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.139.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.139.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.139.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.14.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.14.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.14.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.14.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.14.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.14.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.140.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.140.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.140.gate_proj.weight": 
"model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.140.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.140.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.140.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.141.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.141.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.141.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.141.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.141.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.141.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.142.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.142.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.142.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.142.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.142.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.142.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.143.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.143.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.143.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.143.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.143.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.143.up_proj.weight_scale": "model-00092-of-00092.safetensors", + 
"model.layers.91.mlp.experts.144.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.144.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.144.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.144.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.144.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.144.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.145.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.145.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.145.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.145.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.145.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.145.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.146.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.146.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.146.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.146.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.146.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.146.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.147.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.147.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.147.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.147.gate_proj.weight_scale": 
"model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.147.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.147.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.148.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.148.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.148.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.148.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.148.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.148.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.149.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.149.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.149.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.149.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.149.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.149.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.15.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.15.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.15.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.15.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.15.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.15.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.150.down_proj.weight": "model-00092-of-00092.safetensors", + 
"model.layers.91.mlp.experts.150.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.150.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.150.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.150.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.150.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.151.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.151.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.151.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.151.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.151.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.151.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.152.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.152.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.152.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.152.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.152.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.152.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.153.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.153.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.153.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.153.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.153.up_proj.weight": 
"model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.153.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.154.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.154.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.154.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.154.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.154.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.154.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.155.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.155.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.155.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.155.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.155.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.155.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.156.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.156.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.156.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.156.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.156.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.156.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.157.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.157.down_proj.weight_scale": "model-00092-of-00092.safetensors", + 
"model.layers.91.mlp.experts.157.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.157.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.157.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.157.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.158.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.158.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.158.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.158.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.158.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.158.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.159.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.159.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.159.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.159.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.159.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.159.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.16.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.16.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.16.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.16.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.16.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.16.up_proj.weight_scale": 
"model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.17.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.17.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.17.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.17.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.17.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.17.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.18.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.18.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.18.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.18.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.18.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.18.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.19.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.19.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.19.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.19.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.19.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.19.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.2.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.2.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.2.gate_proj.weight": "model-00092-of-00092.safetensors", + 
"model.layers.91.mlp.experts.2.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.2.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.2.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.20.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.20.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.20.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.20.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.20.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.20.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.21.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.21.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.21.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.21.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.21.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.21.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.22.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.22.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.22.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.22.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.22.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.22.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.23.down_proj.weight": 
"model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.23.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.23.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.23.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.23.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.23.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.24.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.24.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.24.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.24.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.24.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.24.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.25.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.25.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.25.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.25.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.25.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.25.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.26.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.26.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.26.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.26.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + 
"model.layers.91.mlp.experts.26.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.26.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.27.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.27.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.27.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.27.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.27.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.27.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.28.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.28.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.28.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.28.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.28.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.28.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.29.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.29.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.29.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.29.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.29.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.29.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.3.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.3.down_proj.weight_scale": 
"model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.3.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.3.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.3.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.3.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.30.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.30.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.30.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.30.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.30.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.30.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.31.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.31.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.31.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.31.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.31.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.31.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.32.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.32.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.32.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.32.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.32.up_proj.weight": "model-00092-of-00092.safetensors", + 
"model.layers.91.mlp.experts.32.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.33.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.33.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.33.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.33.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.33.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.33.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.34.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.34.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.34.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.34.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.34.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.34.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.35.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.35.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.35.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.35.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.35.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.35.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.36.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.36.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.36.gate_proj.weight": 
"model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.36.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.36.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.36.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.37.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.37.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.37.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.37.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.37.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.37.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.38.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.38.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.38.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.38.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.38.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.38.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.39.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.39.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.39.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.39.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.39.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.39.up_proj.weight_scale": "model-00092-of-00092.safetensors", + 
"model.layers.91.mlp.experts.4.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.4.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.4.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.4.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.4.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.4.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.40.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.40.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.40.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.40.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.40.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.40.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.41.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.41.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.41.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.41.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.41.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.41.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.42.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.42.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.42.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.42.gate_proj.weight_scale": 
"model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.42.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.42.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.43.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.43.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.43.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.43.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.43.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.43.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.44.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.44.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.44.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.44.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.44.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.44.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.45.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.45.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.45.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.45.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.45.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.45.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.46.down_proj.weight": "model-00092-of-00092.safetensors", + 
"model.layers.91.mlp.experts.46.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.46.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.46.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.46.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.46.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.47.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.47.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.47.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.47.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.47.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.47.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.48.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.48.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.48.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.48.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.48.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.48.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.49.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.49.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.49.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.49.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.49.up_proj.weight": 
"model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.49.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.5.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.5.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.5.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.5.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.5.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.5.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.50.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.50.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.50.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.50.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.50.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.50.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.51.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.51.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.51.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.51.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.51.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.51.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.52.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.52.down_proj.weight_scale": "model-00092-of-00092.safetensors", + 
"model.layers.91.mlp.experts.52.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.52.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.52.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.52.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.53.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.53.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.53.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.53.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.53.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.53.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.54.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.54.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.54.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.54.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.54.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.54.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.55.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.55.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.55.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.55.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.55.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.55.up_proj.weight_scale": 
"model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.56.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.56.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.56.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.56.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.56.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.56.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.57.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.57.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.57.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.57.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.57.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.57.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.58.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.58.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.58.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.58.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.58.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.58.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.59.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.59.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.59.gate_proj.weight": "model-00092-of-00092.safetensors", + 
"model.layers.91.mlp.experts.59.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.59.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.59.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.6.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.6.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.6.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.6.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.6.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.6.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.60.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.60.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.60.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.60.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.60.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.60.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.61.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.61.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.61.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.61.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.61.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.61.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.62.down_proj.weight": "model-00092-of-00092.safetensors", 
+ "model.layers.91.mlp.experts.62.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.62.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.62.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.62.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.62.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.63.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.63.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.63.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.63.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.63.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.63.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.64.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.64.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.64.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.64.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.64.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.64.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.65.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.65.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.65.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.65.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.65.up_proj.weight": 
"model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.65.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.66.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.66.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.66.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.66.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.66.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.66.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.67.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.67.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.67.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.67.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.67.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.67.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.68.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.68.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.68.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.68.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.68.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.68.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.69.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.69.down_proj.weight_scale": "model-00092-of-00092.safetensors", + 
"model.layers.91.mlp.experts.69.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.69.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.69.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.69.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.7.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.7.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.7.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.7.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.7.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.7.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.70.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.70.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.70.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.70.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.70.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.70.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.71.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.71.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.71.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.71.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.71.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.71.up_proj.weight_scale": "model-00092-of-00092.safetensors", 
+ "model.layers.91.mlp.experts.72.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.72.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.72.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.72.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.72.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.72.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.73.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.73.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.73.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.73.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.73.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.73.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.74.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.74.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.74.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.74.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.74.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.74.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.75.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.75.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.75.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.75.gate_proj.weight_scale": 
"model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.75.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.75.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.76.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.76.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.76.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.76.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.76.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.76.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.77.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.77.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.77.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.77.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.77.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.77.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.78.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.78.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.78.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.78.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.78.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.78.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.79.down_proj.weight": "model-00092-of-00092.safetensors", + 
"model.layers.91.mlp.experts.79.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.79.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.79.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.79.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.79.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.8.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.8.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.8.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.8.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.8.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.8.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.80.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.80.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.80.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.80.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.80.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.80.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.81.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.81.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.81.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.81.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.81.up_proj.weight": 
"model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.81.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.82.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.82.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.82.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.82.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.82.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.82.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.83.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.83.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.83.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.83.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.83.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.83.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.84.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.84.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.84.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.84.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.84.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.84.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.85.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.85.down_proj.weight_scale": "model-00092-of-00092.safetensors", + 
"model.layers.91.mlp.experts.85.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.85.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.85.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.85.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.86.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.86.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.86.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.86.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.86.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.86.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.87.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.87.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.87.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.87.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.87.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.87.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.88.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.88.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.88.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.88.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.88.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.88.up_proj.weight_scale": 
"model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.89.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.89.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.89.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.89.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.89.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.89.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.9.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.9.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.9.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.9.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.9.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.9.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.90.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.90.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.90.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.90.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.90.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.90.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.91.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.91.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.91.gate_proj.weight": "model-00092-of-00092.safetensors", + 
"model.layers.91.mlp.experts.91.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.91.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.91.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.92.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.92.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.92.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.92.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.92.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.92.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.93.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.93.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.93.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.93.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.93.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.93.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.94.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.94.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.94.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.94.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.94.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.94.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.95.down_proj.weight": 
"model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.95.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.95.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.95.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.95.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.95.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.96.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.96.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.96.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.96.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.96.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.96.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.97.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.97.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.97.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.97.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.97.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.97.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.98.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.98.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.98.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.98.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + 
"model.layers.91.mlp.experts.98.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.98.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.99.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.99.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.99.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.99.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.99.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.experts.99.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.gate.e_score_correction_bias": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.gate.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.shared_experts.down_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.shared_experts.down_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.shared_experts.gate_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.shared_experts.gate_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.shared_experts.up_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.mlp.shared_experts.up_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.post_attention_layernorm.weight": "model-00092-of-00092.safetensors", + "model.layers.91.self_attn.k_norm.weight": "model-00092-of-00092.safetensors", + "model.layers.91.self_attn.k_proj.bias": "model-00092-of-00092.safetensors", + "model.layers.91.self_attn.k_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.self_attn.k_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.self_attn.o_proj.weight": "model-00092-of-00092.safetensors", + 
"model.layers.91.self_attn.o_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.self_attn.q_norm.weight": "model-00092-of-00092.safetensors", + "model.layers.91.self_attn.q_proj.bias": "model-00092-of-00092.safetensors", + "model.layers.91.self_attn.q_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.self_attn.q_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.layers.91.self_attn.v_proj.bias": "model-00092-of-00092.safetensors", + "model.layers.91.self_attn.v_proj.weight": "model-00092-of-00092.safetensors", + "model.layers.91.self_attn.v_proj.weight_scale": "model-00092-of-00092.safetensors", + "model.norm.weight": "model-00092-of-00092.safetensors" + }, + "metadata": { + "total_size": 241145664 + } +} \ No newline at end of file diff --git a/tokenizer.json b/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..43a71efad1ab3f7e4d66d1e48e7cc44f68f21f3a --- /dev/null +++ b/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9340665016419c825c4bdabbcc9acc43b7ca2c68ce142724afa829abb1be5efd +size 19970699 diff --git a/tokenizer_config.json b/tokenizer_config.json new file mode 100644 index 0000000000000000000000000000000000000000..053f12c9b03d5acbcc921042ea0c87a6baa5d3f7 --- /dev/null +++ b/tokenizer_config.json @@ -0,0 +1,325 @@ +{ + "added_tokens_decoder": { + "151329": { + "content": "<|endoftext|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151330": { + "content": "[MASK]", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151331": { + "content": "[gMASK]", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151332": { + "content": "[sMASK]", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + 
"151333": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151334": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151335": { + "content": "<|system|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151336": { + "content": "<|user|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151337": { + "content": "<|assistant|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151338": { + "content": "<|observation|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151339": { + "content": "<|begin_of_image|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151340": { + "content": "<|end_of_image|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151341": { + "content": "<|begin_of_video|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151342": { + "content": "<|end_of_video|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151343": { + "content": "<|begin_of_audio|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151344": { + "content": "<|end_of_audio|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151345": { + "content": "<|begin_of_transcription|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151346": { + 
"content": "<|end_of_transcription|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151347": { + "content": "<|code_prefix|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151348": { + "content": "<|code_middle|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151349": { + "content": "<|code_suffix|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151350": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151351": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151352": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151353": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151354": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151355": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151356": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151357": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151358": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151359": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": 
false + }, + "151360": { + "content": "/nothink", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151361": { + "content": "<|begin_of_box|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151362": { + "content": "<|end_of_box|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151363": { + "content": "<|image|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151364": { + "content": "<|video|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + } + }, + "additional_special_tokens": [ + "<|endoftext|>", + "[MASK]", + "[gMASK]", + "[sMASK]", + "", + "", + "<|system|>", + "<|user|>", + "<|assistant|>", + "<|observation|>", + "<|begin_of_image|>", + "<|end_of_image|>", + "<|begin_of_video|>", + "<|end_of_video|>", + "<|begin_of_audio|>", + "<|end_of_audio|>", + "<|begin_of_transcription|>", + "<|end_of_transcription|>", + "<|code_prefix|>", + "<|code_middle|>", + "<|code_suffix|>", + "/nothink" + ], + "clean_up_tokenization_spaces": false, + "do_lower_case": false, + "eos_token": "<|endoftext|>", + "extra_special_tokens": {}, + "model_max_length": 128000, + "pad_token": "<|endoftext|>", + "padding_side": "left", + "remove_space": false, + "tokenizer_class": "PreTrainedTokenizer" +}